To compare the performance of varKoder to Skmer, we will use leave-one-out cross-validation: we remove one sample from the dataset, train a varKoder model or build a Skmer reference with the remaining samples, and then use the left-out sample as the query. We then record whether varKoder identifies this sample correctly, and whether the closest sample found by Skmer has the same identification.

For traditional barcodes, we assembled the genome of each sample, and then used BLAST to search for each of the traditional barcode genes. We recorded if we could find this gene in the assembly, coding as missing data if we could not. We then recorded whether the best BLAST hit for a sample was the correct species.

rm(list=ls())
library(tidyverse)
── Attaching core tidyverse packages ─────────────────────────────────── tidyverse 2.0.0 ──
✔ dplyr     1.1.2     ✔ readr     2.1.4
✔ forcats   1.0.0     ✔ stringr   1.5.0
✔ ggplot2   3.4.3     ✔ tibble    3.2.1
✔ lubridate 1.9.2     ✔ tidyr     1.3.0
✔ purrr     1.0.2     ── Conflicts ───────────────────────────────────────────────────── tidyverse_conflicts() ──
✖ dplyr::filter() masks stats::filter()
✖ dplyr::lag()    masks stats::lag()
ℹ Use the conflicted package (<http://conflicted.r-lib.org/>) to force all conflicts to become errors
library(future)
library(ggthemes)
library(patchwork)
library(cowplot)

Attaching package: ‘cowplot’

The following object is masked from ‘package:patchwork’:

    align_plots

The following object is masked from ‘package:ggthemes’:

    theme_map

The following object is masked from ‘package:lubridate’:

    stamp
library(patchwork)
library(phytools)
Loading required package: ape

Attaching package: ‘ape’

The following object is masked from ‘package:dplyr’:

    where

Loading required package: maps

Attaching package: ‘maps’

The following object is masked from ‘package:purrr’:

    map
library(ape)
rm(list=ls())
library(tidyverse)
library(future)
library(ggthemes)
library(patchwork)
library(cowplot)
library(patchwork)
library(phytools)
library(ape)

VarKoder

For VarKoder, we used leave-one-out cross-validation to test the accuracy for family, genera, species in the joint Malpighiaceae-Chrysobalanaceae dataset. We used as input data varKodes produced from kmers of size 7 and 500Kbp to 200Mbp of data, or all of the data available if less than 200 Mbp. For each sample, we built a model using as input data from all other samples. Then we queried the sample left out, using as input the images generated from 500Kb to the total data available. Now we will summarize the results.

Accuracy vs data amount and taxonomic levels

In this test, we used varKoder v0.6.0. Let’s process the results.

# Read and score varKoder leave-one-out cross-validation predictions.
#
# Collects every file matching 'predictions.csv' below `infolder` (searched
# recursively), keeps only the queries whose size label is a standardized
# amount (leading zeros, then 1, 2 or 5, then zeros, then 'K') and flags, for
# each taxonomic level, whether the true label is among the predicted labels
# (`*_correct`) and whether any predicted label of that level is not the true
# one (`*_incorrect`).
#
# Arguments:
#   infolder: directory holding the cross-validation output.
#   workers:  number of parallel R sessions used to read the files.
#
# Returns a row-wise tibble with one row per query. Species flags are NA when
# the query carries no species label. Call ungroup() on the result before doing
# column-wise computations.
read_and_process_xval = function(infolder, workers = 12){
  prediction_files = list.files(infolder,
                                'predictions.csv',
                                recursive = TRUE,
                                full.names = TRUE)
  if (length(prediction_files) == 0) {
    stop("No 'predictions.csv' files found under: ", infolder, call. = FALSE)
  }

  # Read in parallel, and put back whatever plan was active before when we
  # leave, including when reading fails half-way.
  previous_plan = plan(multisession, workers = workers)
  on.exit(plan(previous_plan), add = TRUE)

  varkoder_results = prediction_files %>%
    furrr::future_map_dfr(~read_csv(.x) %>% mutate(sample_id = as.character(sample_id))) %>%
    select(-1) %>% # drop the first column of the csv files
    filter(str_detect(query_basepairs,'^0+[125]0+K$')) %>% # we will ignore queries that are not standardized sizes
    rename(query_bp = query_basepairs) %>%
    mutate(quality_included = TRUE)

  varkoder_results = varkoder_results %>%
    mutate(
      # Split first and drop the quality flag afterwards. Deleting the flag
      # together with the ';' on both sides before splitting would glue the
      # two neighbouring labels into one whenever the flag sits between them.
      query_labels = lapply(str_split(actual_labels, ';'),
                            function(labels) labels[!labels %in% c('low_quality:True', '')]),
      predicted_list = str_split(predicted_labels, ';')
    ) %>%
    rowwise() %>%
    mutate(
      family_correct = query_labels[str_detect(query_labels, 'family')] %in% predicted_list,
      genus_correct = query_labels[str_detect(query_labels, 'genus')] %in% predicted_list,
      species_correct = ifelse(any(str_detect(query_labels, 'species')),
                               query_labels[str_detect(query_labels, 'species')] %in% predicted_list,
                               NA),
      family_incorrect = any(!(predicted_list[str_detect(predicted_list, 'family')] %in%
                                 query_labels[str_detect(query_labels, 'family')])),
      genus_incorrect = any(!(predicted_list[str_detect(predicted_list, 'genus')] %in%
                                query_labels[str_detect(query_labels, 'genus')])),
      species_incorrect = ifelse(any(str_detect(query_labels, 'species')),
                                 any(!(predicted_list[str_detect(predicted_list, 'species')] %in%
                                         query_labels[str_detect(query_labels, 'species')])),
                                 NA)
    )

  return(varkoder_results)
}
# Tabulate prediction outcomes per query size for one taxonomic level.
#
# Arguments:
#   res:   data frame with a `query_bp` column (size in thousands of base
#          pairs, optionally suffixed with 'K') and the logical columns
#          `<level>_correct` and `<level>_incorrect`.
#   level: taxonomic level used to build those column names, e.g. 'genus'.
#
# Each row is classified as
#   'correct'      true label predicted and no wrong label predicted,
#   'ambiguous'    true label predicted together with a wrong one,
#   'incorrect'    only wrong label(s) predicted,
#   'inconclusive' no label of this level predicted,
# and rows whose classification is NA are dropped.
#
# Returns an ungrouped tibble with columns `query_bp` (numeric, in base pairs),
# `result`, `N` (number of rows) and `p` (fraction of rows within `query_bp`).
# Combinations of `query_bp` and `result` that do not occur are filled with 0.
summarize_results = function(res, level){
  stopifnot(is.character(level), length(level) == 1)
  correct_col = str_c(level, 'correct', sep = '_')
  incorrect_col = str_c(level, 'incorrect', sep = '_')
  missing_cols = setdiff(c('query_bp', correct_col, incorrect_col), names(res))
  if (length(missing_cols) > 0) {
    stop("`res` lacks required column(s): ", paste(missing_cols, collapse = ', '), call. = FALSE)
  }

  res = ungroup(res)
  # Pull the flags out as plain logical vectors; `res[, col]` would give
  # one-column data frames and depend on implicit matrix coercion.
  is_correct = res[[correct_col]]
  is_incorrect = res[[incorrect_col]]

  res = res %>%
    mutate(result = as.character(
      ifelse(is_correct & !is_incorrect, 'correct',
             ifelse(is_correct & is_incorrect, 'ambiguous',
                    ifelse(!is_correct & is_incorrect, 'incorrect',
                           'inconclusive'))))) %>%
    filter(!is.na(result)) %>%
    group_by(query_bp, result) %>%
    summarise(N = n(), .groups = 'drop') %>%
    group_by(query_bp) %>%
    mutate(p = N/sum(N)) %>%
    ungroup() %>%
    mutate(query_bp = as.integer(str_remove(query_bp, 'K'))*1000) %>%
    # go through a factor so that complete() only expands the observed sizes
    mutate(query_bp = as.factor(query_bp)) %>%
    complete(query_bp, result, fill = list(p = 0, N = 0)) %>%
    mutate(query_bp = as.numeric(as.character(query_bp))) %>%
    ungroup()

  return(res)
}
# Stacked area plot of prediction outcomes against the amount of query data.
#
# Arguments:
#   sum_df:   summary table with columns `query_bp`, `result`, `N` and `p`
#             (the columns produced by summarize_results()).
#   title:    plot title.
#   relative: if TRUE plot the fraction `p` (y axis 0-1); otherwise plot the
#             count `N` (y axis 0 to the largest per-size total).
#   grid:     if TRUE draw horizontal grid lines on top of the areas.
#   xlim_all: if TRUE the x axis spans 500 Kbp - 200 Mbp; otherwise it spans
#             the range of `sum_df$query_bp`.
#
# Returns a ggplot object.
plot_area = function(sum_df, title, relative = FALSE, grid = TRUE, xlim_all = TRUE){
  result_levels = c('correct', 'ambiguous', 'inconclusive', 'incorrect')
  breaks = c(500000,
             1000000,
             2000000,
             5000000,
             10000000,
             20000000,
             50000000,
             100000000,
             200000000
             )
  xlimits = if (xlim_all) range(breaks) else range(sum_df$query_bp)

  sum_df = sum_df %>%
    mutate(result = factor(result, ordered = TRUE, levels = result_levels))

  # The two variants only differ in the plotted column, its label and limits.
  if (relative){
    y_col = 'p'
    y_label = 'Fraction of samples'
    ylimits = c(0, 1)
  } else {
    y_col = 'N'
    y_label = 'Number of samples'
    ylimits = c(0, sum_df %>% group_by(query_bp) %>% summarize(N = sum(N)) %>% pull(N) %>% max)
  }

  # Get colors from a Color Brewer palette, one per outcome
  fill_colors = setNames(RColorBrewer::brewer.pal(4, "Accent"), result_levels)

  p1 = ggplot(sum_df, aes(x = query_bp, y = .data[[y_col]], fill = result)) +
    geom_area(position = 'stack') +
    scale_fill_manual(values = fill_colors) +
    scale_x_log10(labels = scales::label_number(scale_cut = scales::cut_si('bp')), breaks = breaks) +
    ggtitle(title) +
    ylab(y_label) +
    xlab('Base pairs in query images') +
    theme_few() +
    theme(axis.text.x = element_text(hjust = 1, angle = 45))

  if (grid){
    # The y scale is added only here: adding a default scale first and this
    # one afterwards makes ggplot2 report that it replaces an existing scale.
    p1 = p1 +
      scale_y_continuous(n.breaks = 10, minor_breaks = waiver()) +
      theme(panel.background = element_rect(fill = NA),
            panel.grid.major.y = element_line(colour = gray(0.5)),
            panel.grid.minor.y = element_line(colour = gray(0.6), linetype = 2),
            panel.ontop = TRUE)
  }

  p1 = p1 + coord_cartesian(xlim = xlimits, ylim = ylimits, expand = FALSE)

  return(p1)
}
  

Now let’s plot genus-level accuracy for a model taking quality labels into account:

# Load the cross-validation predictions, then tabulate and plot the
# genus-level outcomes as fractions of samples.
results <- read_and_process_xval('Malpighiaceae+Chrysobalanaceae/varKoder/vit_results/')
summary_genus <- results %>% summarize_results('genus')
p_genus <- summary_genus %>% plot_area('varKoder genus', relative = TRUE)
p_genus

Now the same but with species

# Species-level outcomes, plotted as fractions of samples.
summary_species <- results %>% summarize_results('species')
p_species <- summary_species %>% plot_area('varKoder species', relative = TRUE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_species

Finally, family

# Family-level outcomes, plotted as fractions of samples.
summary_family <- results %>% summarize_results('family')
p_family <- summary_family %>% plot_area('varKoder family', relative = TRUE)
p_family

what explains the errors?

Now we will try to identify which samples failed and why they failed. In particular, how do DNA quality, amount of data, and the number of samples per class impact results? We will use genus-level predictions to test.

# One row per query: the confidence that was assigned to the query's true
# genus, with the query size converted from 'K' labels to base pairs.
genus_predictions = results %>%
  ungroup() %>% # `results` is row-wise; nothing below needs per-row evaluation
  mutate(actual_genus = str_extract(actual_labels, 'genus:[^;]*')) %>%
  select(-starts_with('family'),-starts_with('species')) %>%
  # Only the per-genus confidence columns ('genus:<name>') are reshaped. A bare
  # 'genus' prefix would also pull in the logical genus_correct and
  # genus_incorrect flags and mix them into the confidence values.
  pivot_longer(cols = starts_with("genus:"), names_to = "predicted_label", values_to = "confidence") %>%
  filter(actual_genus == predicted_label) %>%
  select(query_bp, sample_id, basefrequency_sd, actual_genus, confidence) %>%
  mutate(query_bp = 1000*(str_remove(query_bp, "K") %>% as.integer))

# Add the number of distinct samples available for each genus.
genus_predictions = genus_predictions %>%
  distinct(sample_id, actual_genus) %>%
  count(actual_genus, name = 'N_samples') %>%
  right_join(genus_predictions, by = 'actual_genus')
Joining with `by = join_by(actual_genus)`
genus_predictions

Now let’s make some plots. First, what is the effect of number of samples per class in confidence?

# Confidence given to the true genus against N_samples - 1 (log x axis),
# jittered to reduce overplotting.
plot_genus_N_vs_conf <- genus_predictions %>%
  ggplot(aes(x = N_samples-1, y = confidence)) +
  geom_jitter(alpha=0.3) +
  scale_color_viridis_c() +
  scale_x_log10() +
  scale_y_continuous(limits=c(0,1)) +
  # Logit-scale alternative, kept for reference:
  #scale_y_continuous(trans = "logit", breaks = c(1e-4,0.001,0.01,0.1,0.25,0.5,0.75,0.9,0.99,0.999,1-1e-4)) +
  #ylab('Confidence in correct prediction\n(logit scale)') +
  xlab('Number of samples in correct genus\n(log scale)') +
  ylab('Confidence in correct prediction') +
  theme_few() +
  theme(panel.grid.major.y = element_line(colour = gray(0.8)))

plot_genus_N_vs_conf

Now, what is the effect of sample quality in confidence?

# Confidence given to the true genus against the standard deviation of base
# frequencies (log x axis).
plot_genus_freqsd_vs_conf <- genus_predictions %>%
  ggplot(aes(x = basefrequency_sd, y = confidence)) +
  geom_point(alpha=0.3) +
  scale_x_log10() +
  scale_y_continuous(limits=c(0,1)) +
  # Logit-scale alternative, kept for reference:
  #scale_y_continuous(trans = "logit", breaks = c(1e-4,0.001,0.01,0.1,0.25,0.5,0.75,0.9,0.99,0.999,1-1e-4)) +
  #ylab('Confidence in correct prediction\n(logit scale)') +
  xlab('Standard deviation of base frequencies') +
  ylab('Confidence in correct prediction') +
  theme_few() +
  theme(panel.grid.major.y = element_line(colour = gray(0.8)))

plot_genus_freqsd_vs_conf

Now, what is the effect of amount of data in confidence?

# Confidence given to the true genus against the amount of query data
# (log x axis), jittered to reduce overplotting.
plot_genus_bp_vs_conf <- genus_predictions %>%
  ggplot(aes(x = query_bp, y = confidence)) +
  geom_jitter(alpha=0.3) +
  scale_x_log10() +
  scale_y_continuous(limits=c(0,1)) +
  # Logit-scale alternative, kept for reference:
  #scale_y_continuous(trans = "logit", breaks = c(1e-4,0.001,0.01,0.1,0.25,0.5,0.75,0.9,0.99,0.999,1-1e-4)) +
  #ylab('Confidence in correct prediction\n(logit scale)') +
  xlab('Base pairs in query images\n(log scale)') +
  ylab('Confidence in correct prediction') +
  theme_few() +
  theme(panel.grid.major.y = element_line(colour = gray(0.8)))

plot_genus_bp_vs_conf

Now let’s save the three of them as a single plot using patchwork.

# Put the three confidence plots side by side, tagged A, B, C. The y-axis title
# and tick labels are kept only on the first panel.
combined_conf = patchwork::wrap_plots(plot_genus_N_vs_conf + theme(text = element_text(size=8)),
                                      plot_genus_bp_vs_conf + theme(axis.title.y=element_blank(), 
                                                                    axis.text.y=element_blank(), 
                                                                    text = element_text(size=8)),
                                      plot_genus_freqsd_vs_conf + theme(axis.title.y=element_blank(), 
                                                                        axis.text.y=element_blank(),
                                                                        text = element_text(size=8))) +
  patchwork::plot_annotation(tag_levels = 'A') 

combined_conf

# Name the plot explicitly: without `plot =`, ggsave() writes whatever plot was
# displayed last, which is only the combined figure if the line above was
# actually printed.
ggsave(filename = 'images_manuscript/supp_conf_predictors.pdf',
       plot = combined_conf,
       device = 'pdf',
       width = 7,
       height = 3,
       units = 'in',
       useDingbats = FALSE)

Let’s put it all together now in a linear model:

# Model input: confidence on the logit scale (values of exactly 1 are nudged
# just below 1 first) and the three predictors centred and scaled to unit
# standard deviation.
lm_data <- genus_predictions %>%
  mutate(
    confidence = car::logit(ifelse(confidence == 1, confidence-0.0000001, confidence))
  ) %>%
  mutate(
    across(c(query_bp, basefrequency_sd, N_samples), ~ (.x - mean(.x))/sd(.x))
  )

# Linear model with all main effects and interactions.
full_model <- lm(formula = confidence~query_bp*basefrequency_sd*N_samples, data = lm_data)
full_model

Call:
lm(formula = confidence ~ query_bp * basefrequency_sd * N_samples, 
    data = lm_data)

Coefficients:
                        (Intercept)                             query_bp  
                            4.92334                              0.16749  
                   basefrequency_sd                            N_samples  
                           -0.58514                              1.67950  
          query_bp:basefrequency_sd                   query_bp:N_samples  
                            0.24651                              0.01799  
         basefrequency_sd:N_samples  query_bp:basefrequency_sd:N_samples  
                            0.01540                              0.02975  
summary(full_model)

Call:
lm(formula = confidence ~ query_bp * basefrequency_sd * N_samples, 
    data = lm_data)

Residuals:
     Min       1Q   Median       3Q      Max 
-16.1052  -1.1535   0.2901   1.4519   5.8115 

Coefficients:
                                    Estimate Std. Error t value Pr(>|t|)    
(Intercept)                          4.92334    0.05383  91.468  < 2e-16 ***
query_bp                             0.16749    0.07211   2.323   0.0203 *  
basefrequency_sd                    -0.58514    0.10373  -5.641  1.9e-08 ***
N_samples                            1.67950    0.05676  29.589  < 2e-16 ***
query_bp:basefrequency_sd            0.24651    0.18896   1.305   0.1922    
query_bp:N_samples                   0.01799    0.07770   0.232   0.8169    
basefrequency_sd:N_samples           0.01540    0.12390   0.124   0.9011    
query_bp:basefrequency_sd:N_samples  0.02975    0.22380   0.133   0.8943    
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

Residual standard error: 2.217 on 2251 degrees of freedom
Multiple R-squared:  0.4317,    Adjusted R-squared:  0.4299 
F-statistic: 244.3 on 7 and 2251 DF,  p-value: < 2.2e-16
plot(full_model)

reduced_model = step(full_model, direction ="both")
Start:  AIC=3604.28
confidence ~ query_bp * basefrequency_sd * N_samples

                                      Df Sum of Sq   RSS    AIC
- query_bp:basefrequency_sd:N_samples  1  0.086829 11060 3602.3
<none>                                             11060 3604.3

Step:  AIC=3602.29
confidence ~ query_bp + basefrequency_sd + N_samples + query_bp:basefrequency_sd + 
    query_bp:N_samples + basefrequency_sd:N_samples

                                      Df Sum of Sq   RSS    AIC
- basefrequency_sd:N_samples           1    0.0044 11060 3600.3
- query_bp:N_samples                   1    0.2090 11060 3600.3
<none>                                             11060 3602.3
- query_bp:basefrequency_sd            1   14.9441 11075 3603.3
+ query_bp:basefrequency_sd:N_samples  1    0.0868 11060 3604.3

Step:  AIC=3600.29
confidence ~ query_bp + basefrequency_sd + N_samples + query_bp:basefrequency_sd + 
    query_bp:N_samples

                             Df Sum of Sq   RSS    AIC
- query_bp:N_samples          1    0.2053 11060 3598.3
<none>                                    11060 3600.3
- query_bp:basefrequency_sd   1   15.0305 11075 3601.4
+ basefrequency_sd:N_samples  1    0.0044 11060 3602.3

Step:  AIC=3598.34
confidence ~ query_bp + basefrequency_sd + N_samples + query_bp:basefrequency_sd

                             Df Sum of Sq   RSS    AIC
<none>                                    11060 3598.3
- query_bp:basefrequency_sd   1      14.8 11075 3599.4
+ query_bp:N_samples          1       0.2 11060 3600.3
+ basefrequency_sd:N_samples  1       0.0 11060 3600.3
- N_samples                   1    5986.7 17047 4573.6
reduced_model

Call:
lm(formula = confidence ~ query_bp + basefrequency_sd + N_samples + 
    query_bp:basefrequency_sd, data = lm_data)

Coefficients:
              (Intercept)                   query_bp           basefrequency_sd  
                   4.9219                     0.1652                    -0.5959  
                N_samples  query_bp:basefrequency_sd  
                   1.6755                     0.2246  
summary(reduced_model)

Call:
lm(formula = confidence ~ query_bp + basefrequency_sd + N_samples + 
    query_bp:basefrequency_sd, data = lm_data)

Residuals:
     Min       1Q   Median       3Q      Max 
-16.1127  -1.1572   0.2955   1.4482   5.8153 

Coefficients:
                          Estimate Std. Error t value Pr(>|t|)    
(Intercept)                4.92189    0.04832 101.855  < 2e-16 ***
query_bp                   0.16518    0.05680   2.908  0.00367 ** 
basefrequency_sd          -0.59594    0.06579  -9.058  < 2e-16 ***
N_samples                  1.67552    0.04797  34.929  < 2e-16 ***
query_bp:basefrequency_sd  0.22460    0.12921   1.738  0.08230 .  
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

Residual standard error: 2.215 on 2254 degrees of freedom
Multiple R-squared:  0.4317,    Adjusted R-squared:  0.4307 
F-statistic:   428 on 4 and 2254 DF,  p-value: < 2.2e-16
plot(reduced_model)

Skmer

For Skmer, we left each sample out, built a reference and then queried that sample. We have several files in which reference samples are ordered by their distance to the query; here we will evaluate whether the closest sample is from the correct species or genus.

Because it is not clear how Skmer behaves for different levels of coverage, we repeated this for several input sizes (in number of base pairs) as query, but always used the maximum input size available (up to 200Mb) for references.

Let’s make a function that extracts these results as a table.


samp_labels = results %>% select(sample_id,actual_labels) %>% distinct()

# Parse the query and its first listed reference from one skmer result file.
#
# Only the first two lines are read. Line 1 is matched as '<sample>@<size>K'
# and line 2 as '<reference>@... <decimal distance>'.
#
# Returns a one-row tibble with sample_id, query_bp (e.g. '500K', kept as
# text), closest_reference_sample_id and closest_distance (numeric). Fields
# that cannot be matched are NA.
extract_skmer_results = function(file_path) {
    top_lines = readLines(file_path, n = 2)

    # Capture groups of the header line: query sample and query size
    query_fields = str_match(top_lines[1], "\\s*(.*?)@(\\d+K)")[, 2:3]

    # Capture groups of the second line: reference sample and its distance
    hit_fields = str_match(top_lines[2], "\\s*(.*?)@.*\\s+(\\d+\\.\\d+)")[, 2:3]

    tibble(
        sample_id = query_fields[1],
        query_bp = query_fields[2],
        closest_reference_sample_id = hit_fields[1],
        closest_distance = as.numeric(hit_fields[2])
    )
}

Now we will apply this function to all skmer output files.

# Parse every skmer result file in parallel, attach the labels of the query and
# of its closest reference, and score the match at each taxonomic level in the
# same way as the varKoder predictions: the labels of the closest reference
# play the role of the predicted labels.
plan(multisession, workers = 12)
skmer_results_df = furrr::future_map_dfr(
  list.files('Malpighiaceae+Chrysobalanaceae/skmer/skmer_xval_results/', full.names = TRUE),
  ~ extract_skmer_results(.x)
) %>%
  left_join(samp_labels, by = 'sample_id') %>%
  left_join(
    samp_labels %>% select(
      closest_reference_sample_id = 'sample_id',
      predicted_labels = actual_labels
    ),
    by = 'closest_reference_sample_id'
  ) %>%
  mutate(
    # Split first and drop the quality flag afterwards. Deleting the flag
    # together with the ';' on both sides before splitting would glue the two
    # neighbouring labels into one whenever the flag sits between them.
    query_labels = lapply(str_split(actual_labels, ';'),
                          function(labels) labels[!labels %in% c('low_quality:True', '')]),
    predicted_list = str_split(predicted_labels, ';')
  ) %>%
  rowwise() %>%
  mutate(
    family_correct = query_labels[str_detect(query_labels, 'family')] %in% predicted_list,
    genus_correct = query_labels[str_detect(query_labels, 'genus')] %in% predicted_list,
    species_correct = ifelse(any(str_detect(
      query_labels, 'species'
    )),
    query_labels[str_detect(query_labels, 'species')] %in% predicted_list,
    NA),
    family_incorrect = any(!(predicted_list[str_detect(predicted_list, 'family')] %in% query_labels[str_detect(query_labels, 'family')])),
    genus_incorrect = any(!(predicted_list[str_detect(predicted_list, 'genus')] %in% query_labels[str_detect(query_labels, 'genus')])),
    species_incorrect = ifelse(any(str_detect(
      query_labels, 'species'
    )),
    any(!(
      predicted_list[str_detect(predicted_list, 'species')] %in% query_labels[str_detect(query_labels, 'species')]
    )),
    NA)
    
  )
plan(sequential)
skmer_results_df

Now let’s summarize and plot by genus:

# Genus-level Skmer outcomes, plotted as fractions of samples.
skmer_summary_genus <- skmer_results_df %>% summarize_results('genus')
p_skmer_genus <- skmer_summary_genus %>% plot_area('Skmer genus', relative = TRUE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_skmer_genus

Now by species. In Skmer, there is no inconclusive result: if there is no correct species prediction, it means that a sample was predicted in the wrong genus and therefore it is incorrect

# Species-level Skmer outcomes. Every outcome other than 'correct' is relabelled
# 'incorrect', and N and p are then added up within each query size and outcome.
skmer_summary_species <- skmer_results_df %>%
  summarize_results('species') %>%
  mutate(result = ifelse(result == 'correct', 'correct','incorrect')) %>%
  group_by(query_bp, result) %>%
  summarise(across(everything(), sum), .groups = 'drop_last')
p_skmer_species <- skmer_summary_species %>% plot_area('Skmer species', relative = TRUE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_skmer_species

And now by family:

# Family-level Skmer outcomes: show the table, then build the plot.
skmer_summary_family <- skmer_results_df %>% summarize_results('family')
skmer_summary_family
p_skmer_family <- skmer_summary_family %>% plot_area('Skmer family', relative = TRUE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_skmer_family

Traditional barcodes

BLAST single gene

Let’s now read the traditional barcode BLAST results and summarize them in the same way as Skmer and varKoder. Let’s start by defining a function that reads the data so we can summarize it using the previously defined functions.

# Read and score the traditional-barcode BLAST results for one data amount.
#
# Arguments:
#   bp: amount of data as it appears in the file name
#       ('<bp>M_blast_phylo_sum_sp.tsv').
#
# The table is reshaped to one row per sample and marker, the
# 'Concatenated_phylogeny' column is discarded, and the labels of the query and
# of its best hit are looked up in the global `samp_labels`. Each row is then
# scored per taxonomic level like the varKoder and Skmer results. When the best
# hit has no labels (no hit, or a hit that is not in `samp_labels`) every
# non-NA flag is set to FALSE.
#
# Returns a row-wise tibble. `query_bp` is stored as `bp * 1e3`, i.e. in
# thousands of base pairs, which summarize_results() multiplies by 1000.
read_traditional_barcodes = function(bp) {
  input_file = paste0(
    'Malpighiaceae+Chrysobalanaceae/traditional_barcodes/2_blast_phylogeny_result/Genus/',
    bp,
    'M_blast_phylo_sum_sp.tsv'
  )
  
  # The files are tab-separated; stating it avoids delimiter guessing and the
  # column-specification message printed for every file.
  barcode_res = read_delim(input_file, delim = '\t', show_col_types = FALSE) %>%
    pivot_longer(-sp, names_to = 'marker', values_to = 'closest_reference_sample_id') %>%
    rename(sample_id = 'sp') %>%
    mutate(
      sample_id = str_remove_all(sample_id, '@.+'),
      closest_reference_sample_id = str_remove_all(closest_reference_sample_id, '@.+'),
      predicted_labels = samp_labels$actual_labels[match(closest_reference_sample_id, samp_labels$sample_id)],
      actual_labels = samp_labels$actual_labels[match(sample_id, samp_labels$sample_id)]
    ) %>%
    filter(marker != 'Concatenated_phylogeny') %>%
    mutate(
      # Split first and drop the quality flag afterwards. Deleting the flag
      # together with the ';' on both sides before splitting would glue the
      # two neighbouring labels into one whenever the flag sits between them.
      query_labels = lapply(str_split(actual_labels, ';'),
                            function(labels) labels[!labels %in% c('low_quality:True', '')]),
      predicted_list = str_split(predicted_labels, ';')
    ) %>%
    rowwise() %>%
    mutate(
      family_correct = query_labels[str_detect(query_labels, 'family')] %in% predicted_list,
      genus_correct = query_labels[str_detect(query_labels, 'genus')] %in% predicted_list,
      species_correct = ifelse(any(str_detect(
        query_labels, 'species'
      )),
      query_labels[str_detect(query_labels, 'species')] %in% predicted_list,
      NA),
      family_incorrect = any(!(predicted_list[str_detect(predicted_list, 'family')] %in% query_labels[str_detect(query_labels, 'family')])),
      genus_incorrect = any(!(predicted_list[str_detect(predicted_list, 'genus')] %in% query_labels[str_detect(query_labels, 'genus')])),
      species_incorrect = ifelse(any(str_detect(
        query_labels, 'species'
      )),
      any(!(
        predicted_list[str_detect(predicted_list, 'species')] %in% query_labels[str_detect(query_labels, 'species')]
      )),
      NA)
    ) %>%
    # No labels for the best hit: neither correct nor incorrect.
    mutate(across(c(ends_with("_correct"), ends_with("_incorrect")),
                  ~ ifelse(is.na(predicted_labels) & !is.na(.x), FALSE, .x))) %>%
    mutate(query_bp = bp * 1e3)
  
  return(barcode_res)
}

Now we can apply this function to all of our results:

results_barcodes = purrr::map_dfr(c(10,20,50,100,200),read_traditional_barcodes)
Rows: 288 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Rows: 285 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Rows: 267 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Rows: 200 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Rows: 166 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
results_barcodes

Now let’s summarise for each marker separately:

# Per-marker summaries: split the combined barcode results by marker, run
# summarize_results() on each piece at one taxonomic level, and row-bind the
# pieces with the marker name stored in the `marker` column.
barcode_summary_family <- results_barcodes %>%
  split(.$marker) %>%
  purrr::map_dfr(summarize_results, level = 'family', .id = 'marker')

barcode_summary_family
barcode_summary_genus <- results_barcodes %>%
  split(.$marker) %>%
  purrr::map_dfr(summarize_results, level = 'genus', .id = 'marker')

barcode_summary_genus
barcode_summary_species <- results_barcodes %>%
  split(.$marker) %>%
  purrr::map_dfr(summarize_results, level = 'species', .id = 'marker')

barcode_summary_species

Now let’s plot, making separate plots for each marker:

Species:

# One relative (fraction-of-samples) area plot per marker; the x range of
# each plot follows that marker's own data (xlim_all = FALSE).
p_barcode_species <- split(barcode_summary_species, barcode_summary_species$marker) %>%
  purrr::map(function(marker_summary) {
    plot_area(marker_summary,
              paste0(unique(marker_summary$marker), ' species'),
              relative = TRUE,
              xlim_all = FALSE)
  })
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_barcode_species
$ITS

$matK

$ndhF

$rbcL

$`trnL-F`

Genera:

# One relative (fraction-of-samples) area plot per marker; the x range of
# each plot follows that marker's own data (xlim_all = FALSE).
p_barcode_genus <- split(barcode_summary_genus, barcode_summary_genus$marker) %>%
  purrr::map(function(marker_summary) {
    plot_area(marker_summary,
              paste0(unique(marker_summary$marker), ' genus'),
              relative = TRUE,
              xlim_all = FALSE)
  })
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_barcode_genus
$ITS

$matK

$ndhF

$rbcL

$`trnL-F`

Family:

# One relative (fraction-of-samples) area plot per marker; the x range of
# each plot follows that marker's own data (xlim_all = FALSE).
p_barcode_family <- split(barcode_summary_family, barcode_summary_family$marker) %>%
  purrr::map(function(marker_summary) {
    plot_area(marker_summary,
              paste0(unique(marker_summary$marker), ' family'),
              relative = TRUE,
              xlim_all = FALSE)
  })
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_barcode_family
$ITS

$matK

$ndhF

$rbcL

$`trnL-F`

Concatenated tree

Now we will do the same for the concatenated tree. Let’s start by defining a function to gather results. For each sample, we find the reference tip with the smallest patristic distance in the tree, and we consider the result correct if that reference has the same label as the sample.


# Score the concatenated-barcode phylogeny for one subsampling depth.
#
# Reads the concatenated tree for depth `bp`, finds for every query tip the
# reference tip (label ending in "_ref") at the smallest patristic distance,
# and compares the labels of that reference with the labels of the query.
#
# Arguments:
#   bp  Numeric depth tag used in the input file names
#       ('conc.<bp>m.spname.tre' and '<bp>M_blast_phylo_sum_sp.tsv');
#       `query_bp` in the output is bp * 1e3.
#
# Returns a rowwise tibble with one row per sample listed in the BLAST summary
# table (sample '2095' excluded) holding: sample_id,
# closest_reference_sample_id, predicted_labels, actual_labels, the list
# columns query_labels and predicted_list, and for family, genus and species
#   <level>_correct   - the query's label of that level is among the labels of
#                       the closest reference;
#   <level>_incorrect - the closest reference carries a label of that level
#                       that the query does not have.
# Species flags are NA when the query has no species label. When a sample has
# no closest reference (predicted_labels is NA) every non-NA flag is FALSE.
#
# Relies on the global `samp_labels` (columns sample_id and actual_labels).
read_concatenated_tree_results <- function(bp) {
  result_dir <- 'Malpighiaceae+Chrysobalanaceae/traditional_barcodes/2_blast_phylogeny_result/Genus/'

  tree <- read.tree(paste0(result_dir, 'conc.', bp, 'm.spname.tre'))

  # Leave only sample IDs as tip labels: drop everything up to the last '@',
  # strip every quote character, and normalise ' ref' to '_ref'.
  tree$tip.label <- tree$tip.label %>%
    str_remove(".*@") %>%
    str_remove_all("'") %>%
    str_replace(' ref', '_ref')

  # Patristic distances between all tips; tips ending in '_ref' are references,
  # every other tip is a query.
  patristic_distances <- cophenetic(tree)
  tip_names <- rownames(patristic_distances)
  is_ref <- str_detect(tip_names, '_ref$')
  all_ref_names <- tip_names[is_ref]
  all_nonref <- tip_names[!is_ref]

  # Closest reference for one query tip, never the tip's own reference.
  # The own reference is excluded by exact name (a regex/substring test would
  # also drop e.g. '2095_ref' for tip '95'), and the minimum is taken over
  # references only, so the result does not depend on the tip sorting first.
  find_closest <- function(tip) {
    candidates <- setdiff(all_ref_names, paste0(tip, '_ref'))
    if (length(candidates) == 0) {
      return(NA_character_)
    }
    nearest <- which.min(patristic_distances[tip, candidates])
    str_remove(candidates[nearest], '_ref$')
  }

  closest_match <- purrr::map_chr(all_nonref, find_closest)

  # Samples present in the BLAST summary table; the ID is the part of `sp`
  # before the first '@'.
  samples_with_data <- read_delim(paste0(result_dir, bp, 'M_blast_phylo_sum_sp.tsv')) %>%
    select(sample_id = sp) %>%
    mutate(sample_id = str_remove_all(sample_id, '@.+'))

  barcode_res <- tibble(sample_id = all_nonref,
                        closest_reference_sample_id = closest_match) %>%
    # Keep every sample of the summary table, including those missing from
    # the tree (their closest reference is NA).
    right_join(samples_with_data, by = 'sample_id') %>%
    mutate(
      predicted_labels = samp_labels$actual_labels[match(closest_reference_sample_id, samp_labels$sample_id)],
      actual_labels = samp_labels$actual_labels[match(sample_id, samp_labels$sample_id)]
    ) %>%
    # NOTE(review): sample 2095 is excluded by hard-coded ID; the reason is
    # not visible in this function.
    filter(sample_id != '2095') %>%
    mutate(
      query_labels = str_remove(actual_labels, ";*low_quality:True;*") %>% str_split(';'),
      predicted_list = str_split(predicted_labels, ';')
    ) %>%
    rowwise() %>%
    mutate(
      family_correct = query_labels[str_detect(query_labels, 'family')] %in% predicted_list,
      genus_correct = query_labels[str_detect(query_labels, 'genus')] %in% predicted_list,
      species_correct = ifelse(any(str_detect(
        query_labels, 'species'
      )),
      query_labels[str_detect(query_labels, 'species')] %in% predicted_list,
      NA),
      family_incorrect = any(!(predicted_list[str_detect(predicted_list, 'family')] %in% query_labels[str_detect(query_labels, 'family')])),
      genus_incorrect = any(!(predicted_list[str_detect(predicted_list, 'genus')] %in% query_labels[str_detect(query_labels, 'genus')])),
      species_incorrect = ifelse(any(str_detect(
        query_labels, 'species'
      )),
      any(!(
        predicted_list[str_detect(predicted_list, 'species')] %in% query_labels[str_detect(query_labels, 'species')]
      )),
      NA)
    ) %>%
    # Without a prediction nothing can be correct or incorrect: force the
    # flags to FALSE, but keep NA where the level does not apply.
    mutate(across(
      c(ends_with("_correct"), ends_with("_incorrect")),
      ~ ifelse(is.na(predicted_labels) & !is.na(.x), FALSE, .x)
    )) %>%
    mutate(query_bp = bp * 1e3)

  # The result is intentionally left rowwise, as before.
  barcode_res
}

Now let’s apply this function

# Run the concatenated-tree reader once per subsampling depth tag and
# row-bind the per-depth tables into one data frame.
results_concat_barcodes <- c(10, 20, 50, 100, 200) %>%
  purrr::map_dfr(read_concatenated_tree_results)
Rows: 288 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Joining with `by = join_by(sample_id)`Rows: 285 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Joining with `by = join_by(sample_id)`Rows: 267 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Joining with `by = join_by(sample_id)`Rows: 200 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Joining with `by = join_by(sample_id)`Rows: 166 Columns: 7── Column specification ───────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (7): sp, matK, rbcL, ndhF, trnL-F, ITS, Concatenated_phylogeny
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.Joining with `by = join_by(sample_id)`
results_concat_barcodes

Let’s summarize results and plot for genus, species and family accuracy

# Species-level summary and plot for the concatenated barcodes.
# The plot uses relative = TRUE (fraction of samples), like every other
# species panel: in the species comparison figure this panel is drawn with its
# y axis hidden next to fraction-scaled barcode panels, so a count scale would
# be read against the wrong axis.
concat_summary_species = summarize_results(results_concat_barcodes,'species')
p_concat_species = plot_area(concat_summary_species, relative = TRUE,title = 'Concatenated barcodes species',xlim_all = FALSE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_concat_species

# Genus-level summary and plot for the concatenated barcodes.
# xlim_all = FALSE limits the x axis to the depths present in the data, as for
# the single-marker barcode panels this plot is placed beside in the genus
# comparison figure (and as for the species and family versions of this plot).
concat_summary_genus = summarize_results(results_concat_barcodes,'genus')
p_concat_genus = plot_area(concat_summary_genus, relative = TRUE,title = 'Concatenated barcodes genus',xlim_all = FALSE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_concat_genus

# Family-level summary and relative area plot for the concatenated barcodes;
# the x axis is limited to the depths present in the data.
concat_summary_family <- results_concat_barcodes %>%
  summarize_results('family')
p_concat_family <- plot_area(concat_summary_family,
                             title = 'Concatenated barcodes family',
                             relative = TRUE,
                             xlim_all = FALSE)
Scale for y is already present.
Adding another scale for y, which will replace the existing scale.
p_concat_family

Direct comparison

Now let’s compare methods side by side. For genus level:

# Genus-level comparison figure.
# Upper part (70% of the height): p_genus stacked over p_skmer_genus; the
# x-axis text and title of the upper panel are hidden.
p1 = patchwork::wrap_plots(p_genus + theme(axis.text.x = element_blank(),
                                           axis.title.x = element_blank()), 
                   p_skmer_genus, ncol = 1) 
# Lower part: ITS, rbcL and concatenated barcodes in one row; only the last
# panel keeps its legend and only the first keeps its y axis.
p2 = patchwork::wrap_plots(p_barcode_genus$ITS + theme(legend.position = 'none'),
                   p_barcode_genus$rbcL + theme(legend.position = 'none', 
                                                axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   p_concat_genus + theme(axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   nrow = 1)
p = patchwork::wrap_plots(p1,p2,ncol=1,heights = c(0.7,0.3)) +
  plot_annotation(title = 'Genus-level accuracy')
p

# Pass the plot explicitly so the saved file does not depend on which plot
# happened to be displayed last.
ggsave('images_manuscript/fig3_genus_accuracy.pdf', plot = p, width=5,height = 10)
ggsave('images_manuscript/fig3_genus_accuracy.png', plot = p, width=5,height = 10,dpi=1200)

Now for species level:

# Species-level comparison figure.
# Upper part (70% of the height): p_species stacked over p_skmer_species; the
# x-axis text and title of the upper panel are hidden.
p1 = patchwork::wrap_plots(p_species + theme(axis.text.x = element_blank(),
                                           axis.title.x = element_blank()), 
                   p_skmer_species, ncol = 1) 
# Lower part: ITS, rbcL and concatenated barcodes in one row; only the last
# panel keeps its legend and only the first keeps its y axis.
p2 = patchwork::wrap_plots(p_barcode_species$ITS + theme(legend.position = 'none'),
                   p_barcode_species$rbcL + theme(legend.position = 'none', 
                                                axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   p_concat_species + theme(axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   nrow = 1)
p = patchwork::wrap_plots(p1,p2,ncol=1,heights = c(0.7,0.3)) +
  plot_annotation(title = 'species-level accuracy')
p

# Pass the plot explicitly so the saved file does not depend on which plot
# happened to be displayed last.
ggsave('images_manuscript/fig3_species_accuracy.pdf', plot = p, width=5,height = 10)
ggsave('images_manuscript/fig3_species_accuracy.png', plot = p, width=5,height = 10,dpi=1200)

Now for family level:

# Family-level comparison figure.
# Upper part (70% of the height): p_family stacked over p_skmer_family; the
# x-axis text and title of the upper panel are hidden.
p1 = patchwork::wrap_plots(p_family + theme(axis.text.x = element_blank(),
                                           axis.title.x = element_blank()), 
                   p_skmer_family, ncol = 1) 
# Lower part: ITS, rbcL and matK in one row; only the last panel keeps its
# legend and only the first keeps its y axis.
# NOTE(review): the genus and species figures use the concatenated-barcode
# plot as third panel, whereas here matK is shown and p_concat_family is never
# included in a figure - confirm that this is intended.
p2 = patchwork::wrap_plots(p_barcode_family$ITS + theme(legend.position = 'none'),
                   p_barcode_family$rbcL + theme(legend.position = 'none', 
                                                axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   p_barcode_family$matK + theme(axis.title.y = element_blank(),
                                                axis.text.y = element_blank()),
                   nrow = 1)
p = patchwork::wrap_plots(p1,p2,ncol=1,heights = c(0.7,0.3)) +
  plot_annotation(title = 'family-level accuracy')
p
# Pass the plot explicitly so the saved file does not depend on which plot
# happened to be displayed last.
ggsave('images_manuscript/fig3_family_accuracy.pdf', plot = p, width=5,height = 10)
ggsave('images_manuscript/fig3_family_accuracy.png', plot = p, width=5,height = 10,dpi=1200)

Comparison of run times

Now let’s compare the time to produce references and to produce query results.

SRA

Finally, let’s summarize results for the whole SRA dataset. In this case, we only have varKoder since Skmer cannot finish and traditional barcodes are inapplicable.

# Load the SRA query predictions: drop the first column, keep only queries
# whose size tag matches the standardized pattern, and rename the size column
# to `query_bp`.
varKoder_SRA_results <- read_csv('all_SRA/varkoder_query_results/predictions.csv') %>%
  select(-1) %>%
  filter(str_detect(query_basepairs, '^0+[125]0+K$')) %>%
  rename(query_bp = query_basepairs) %>%
  mutate(quality_included = TRUE)
plan(sequential)

# Unique labels among the queries, with the low-quality flag stripped.
SRA_taxlabels <- varKoder_SRA_results$actual_labels %>%
  str_remove(";*low_quality:True;*") %>%
  str_split(';') %>%
  unlist() %>%
  unique()

# Per query:
#   family_correct   - the actual label is among the predicted labels;
#   family_incorrect - some predicted label is not an actual label (always
#                      FALSE when nothing was predicted).
# The final select() keeps only columns whose name does not start with a digit.
varKoder_SRA_results <- varKoder_SRA_results %>%
  mutate(
    query_labels = unlist(str_split(str_remove(actual_labels, ";*low_quality:True;*"), ';')),
    predicted_list = str_split(predicted_labels, ';')
  ) %>%
  rowwise() %>%
  mutate(
    family_correct = query_labels %in% predicted_list,
    family_incorrect = !is.na(predicted_labels) && !all(predicted_list %in% query_labels)
  ) %>%
  select(matches("^[^0-9]"))

varKoder_SRA_results 
         

Now let’s summarize and plot:

# Family-level summary of the SRA queries.
SRA_summary_family <- varKoder_SRA_results %>%
  summarize_results('family')
SRA_summary_family

# Total number of summarised samples at each query size.
N_samp <- summarise(group_by(SRA_summary_family, query_bp), N = sum(N))

# Relative (fraction-of-samples) area plot over all SRA queries.
p_SRA_family <- plot_area(SRA_summary_family,
                          title = 'varKoder SRA family',
                          relative = TRUE)
p_SRA_family 

Let’s now do the SRA plot, but splitting by kingdom. First, we need to retrieve kingdom information:


# Attach the Kingdom of each run to the SRA results, then build one
# family-level relative area plot per kingdom, titled with the kingdom name
# and restricted to query sizes between 500 Kbp and 10 Mbp.
p_SRA_families <- read_csv('all_SRA/runs_to_download_data.csv') %>%
  select(sample_id = Run, Kingdom) %>%
  right_join(varKoder_SRA_results) %>%
  split(.$Kingdom) %>%
  purrr::map(function(kingdom_res) {
    summarize_results(kingdom_res, level = 'family')
  }) %>%
  purrr::imap(function(kingdom_summary, kingdom_name) {
    plot_area(kingdom_summary, kingdom_name, relative = TRUE) +
      coord_cartesian(xlim = c(500, 10000) * 1000, expand = FALSE)
  })

p_SRA_families

Now let’s join to create a plot for publication:

# Strip a plot for use as a non-first panel in a row: removes the y-axis
# title, text and ticks, the x-axis title, and the legend.
#   x  a ggplot object
# Returns the modified plot.
remove_y_axis_and_scale <- function(x) {
  blank <- element_blank()
  stripped_theme <- theme(legend.position = 'none',
                          axis.title.x = blank,
                          axis.title.y = blank,
                          axis.text.y = blank,
                          axis.ticks.y = blank)
  x + stripped_theme
}

# Modify the last plot to have the x-axis label
p_SRA_families$Fungi <- p_SRA_families$Fungi + labs(x = "Base pairs in query images")

# Combine plots
p_combined <- wrap_plots(p_SRA_families$Metazoa + 
                           theme(legend.position = 'none',
                                 axis.title.x = element_blank()),
                         remove_y_axis_and_scale(p_SRA_families$Viridiplantae),
                         remove_y_axis_and_scale(p_SRA_families$Fungi),
                         nrow = 1)

# Add title and set layout
# Create a blank ggplot object with the desired x-axis title
x_title_plot <- ggplot() + 
  theme_void() + 
  labs(x = "Base pairs in query images") +
  theme(plot.margin = margin(0, 0, 0, 0),
        axis.title.x = element_text(size = 10, hjust = 0.5))


p = wrap_plots(p_combined, x_title_plot,ncol=1,heights = c(0.95,0.05))
    
  

print(p)


ggsave('images_manuscript/fig3_SRA_accuracy.pdf', width=4.5,height = 4)
ggsave('images_manuscript/fig3_SRA_accuracy.png', width=4.5,height = 4,dpi = 1200)

Generating numbers for publication

Here we just query our results to get a few figures that we report in the paper.

Total number of samples used in cross-validation:

dim(samp_labels)

Number of Stigmaphyllon samples with each kind of error for varKoder:

summary_species

Number of Stigmaphyllon samples with each kind of error for Skmer:

skmer_summary_species

varKoder accuracy for genera:

summary_genus

varKoder accuracy for family:

summary_family

Skmer accuracy for genera:

skmer_summary_genus

Skmer accuracy for family:

skmer_summary_family

Number of samples available for each genus and data amount

# Number of query samples for every genus x data-amount combination.
# The genus is taken from the 'genus:' entry of actual_labels. Counts are
# grouped by genus AND query_bp (the genus column was previously computed but
# never used), and combinations with no samples are filled in with N = 0.
results %>%
  mutate(genus = str_extract(actual_labels,"(?<=genus:)[^;]+")) %>%
  group_by(genus, query_bp) %>%
  summarize(N = n(), .groups = 'drop') %>%
  complete(genus, query_bp, fill = list(N = 0))

Plot number of samples for supplementary material.

# Sample counts per taxon and query size, with absent taxon x size
# combinations filled in as N = 0.

# Genera: taxon is the 'genus:' entry of actual_labels.
n_samples_genera <- results %>%
  mutate(taxon = str_extract(actual_labels, "(?<=genus:)[^;]+")) %>%
  group_by(taxon, query_bp) %>%
  summarize(N = n()) %>%
  ungroup() %>%
  complete(taxon, query_bp, fill = list(N = 0))
n_samples_genera 

# Species: taxon is the 'species:' entry; samples without one are dropped.
n_samples_species <- results %>%
  mutate(taxon = str_extract(actual_labels, "(?<=species:)[^;]+")) %>%
  filter(!is.na(taxon)) %>%
  group_by(taxon, query_bp) %>%
  summarize(N = n()) %>%
  ungroup() %>%
  complete(taxon, query_bp, fill = list(N = 0))
n_samples_species 

# SRA: taxon is the complete actual_labels string.
n_samples_SRA <- varKoder_SRA_results %>%
  mutate(taxon = as.character(actual_labels)) %>%
  group_by(taxon, query_bp) %>%
  summarize(N = n()) %>%
  ungroup() %>%
  complete(taxon, query_bp, fill = list(N = 0))
n_samples_SRA 
# Stacked area plot of the number of samples per taxon across query sizes.
#
# Arguments:
#   df     data frame with columns `taxon`, `query_bp` (text from which
#          parse_number() extracts the size; the value is multiplied by 1000)
#          and `N` (number of samples).
#   title  plot title.
#
# Returns a ggplot object. Fill and outline share one colour per taxon and no
# legend is drawn.
#
# Note: the x-axis breaks and limits are always taken from the global
# `n_samples_genera`, whatever `df` is, so all panels share one x axis.
plot_Nsamples_area <- function(df, title) {
  df <- df %>%
    mutate(query_bp = parse_number(query_bp) * 1000)

  n_levels <- length(unique(df$taxon))
  viridis_colors <- viridis::turbo(n_levels)

  # Interleave the first and second half of the palette (1st, (half+1)th,
  # 2nd, (half+2)th, ...) so that neighbouring taxa get contrasting colours.
  # Ordering on a key handles odd counts and a single taxon without vector
  # recycling or out-of-range indices.
  half_n <- ceiling(n_levels / 2)
  interleave_key <- c(seq_len(half_n), seq_len(n_levels - half_n) + 0.5)
  reordered_colors <- viridis_colors[order(interleave_key)]

  reference_bp <- 1000 * parse_number(unique(n_samples_genera$query_bp))

  ggplot(df, aes(x = query_bp, y = N, fill = taxon, color = taxon, group = taxon)) +
    geom_area(position = position_stack()) +
    scale_fill_manual(values = reordered_colors,
                      aesthetics = c('colour', 'fill'),
                      guide = 'none') +
    scale_x_log10(labels = scales::label_number(scale_cut = scales::cut_si('bp')),
                  breaks = reference_bp,
                  limits = range(reference_bp)) +
    scale_y_continuous(n.breaks = 10, minor_breaks = waiver()) +
    ggtitle(title) +
    ylab('Number of samples') +
    xlab('Base pairs in query images') +
    theme_few() +
    # Transparent panel drawn on top, so the horizontal grid lines stay
    # visible over the filled areas.
    theme(axis.text.x = element_text(hjust = 1, angle = 45),
          panel.background = element_rect(fill = NA),
          panel.grid.major.y = element_line(colour = gray(0.5)),
          panel.grid.minor.y = element_line(colour = gray(0.6), linetype = 2),
          panel.ontop = TRUE)
}
# Sample-count panels for the supplementary material (titles corrected:
# 'Malpighiaceae', 'families').
N_species = plot_Nsamples_area(n_samples_species,title='Stigmaphyllon Species')
N_genera = plot_Nsamples_area(n_samples_genera,title='Malpighiaceae and Chrysobalanaceae Genera')
N_families = plot_Nsamples_area(n_samples_SRA,title='SRA families')

# Genera, species and SRA families side by side in one row.
cowplot::plot_grid(N_genera,N_species,N_families, nrow = 1)

Total number of SRA samples, split by whether they belong to the validation set:

# Count the rows of the model input table for each value of `is_valid`,
# after dropping the table's first column.
read_csv('varKoder/all_SRA/varkoder_trained_model_ML/input_data.csv') %>%
  select(-1) %>%
  group_by(is_valid) %>%
  summarise(N = n())
LS0tCnRpdGxlOiAiVmFyS29kZXIsIFNrbWVyIGFuZCB0cmFkaXRpb25hbCBiYXJjb2RpbmcgQ3Jvc3MtdmFsaWRhdGlvbiIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKVG8gY29tcGFyZSB0aGUgcGVyZm9ybWFuY2Ugb2YgdmFyS29kZSB0byBbU2ttZXJdKGh0dHBzOi8vZ2l0aHViLmNvbS9zaGFoYWItc2FybWFzaGdoaS9Ta21lciksIHdlIHdpbGwgdXNlIGxlYXZlLW9uZS1vdXQgY3Jvc3MgdmFsaWRhdGlvbjogd2UgcmVtb3ZlIG9uZSBzYW1wbGUgZnJvbSB0aGUgZGF0YXNldCwgdHJhaW4gYSB2YXJLb2RlIG1vZGVsIG9yIG1ha2UgYSBza21lciByZWZlcmVuY2Ugd2l0aCB0aGUgcmVtYWluaW5nIHNhbXBsZXMsIGFuZCB0aGVuIHVzZSB0aGUgc2FtcGxlIGxlZnQgb3V0IGFzIHF1ZXJ5LiBXZSB0aGVuIHJlY29yZCB3aGV0aGVyIG9yIG5vdCB3ZSBjb3JyZWN0bHkgaWRlbnRpZnkgdGhpcyBzYW1wbGUgaW4gdmFyS29kZXIsIGFuZCB3aGV0aGVyIG9yIG5vdCB0aGUgY2xvc2VzdCBzYW1wbGUgd2l0aCBTa21lciBoYXMgdGhlIHNhbWUgaWRlbnRpZmljYXRpb24uIAoKRm9yIHRyYWRpdGlvbmFsIGJhcmNvZGVzLCB3ZSBhc3NlbWJsZWQgdGhlIGdlbm9tZSBvZiBlYWNoIHNhbXBsZSwgYW5kIHRoZW4gdXNlZCBCTEFTVCB0byBzZWFyY2ggZm9yIGVhY2ggb2YgdGhlIHRyYWRpdGlvbmFsIGJhcmNvZGUgZ2VuZXMuIFdlIHJlY29yZGVkIGlmIHdlIGNvdWxkIGZpbmQgdGhpcyBnZW5lIGluIHRoZSBhc3NlbWJseSwgY29kaW5nIGFzIG1pc3NpbmcgZGF0YSBpZiB3ZSBjb3VsZCBub3QuIFdlIHRoZW4gcmVjb3JkZWQgd2hldGhlciB0aGUgYmVzdCBCTEFTVCBoaXQgZm9yIGEgc2FtcGxlIHdhcyB0aGUgY29ycmVjdCBzcGVjaWVzLgoKYGBge3J9CnJtKGxpc3Q9bHMoKSkKbGlicmFyeSh0aWR5dmVyc2UpCmxpYnJhcnkoZnV0dXJlKQpsaWJyYXJ5KGdndGhlbWVzKQpsaWJyYXJ5KHBhdGNod29yaykKbGlicmFyeShjb3dwbG90KQpsaWJyYXJ5KHBhdGNod29yaykKbGlicmFyeShwaHl0b29scykKbGlicmFyeShhcGUpCmBgYAojIFZhcktvZGVyCkZvciBWYXJLb2Rlciwgd2UgdXNlZCBsZWF2ZS1vbmUtb3V0IGNyb3NzLXZhbGlkYXRpb24gdG8gdGVzdCB0aGUgYWNjdXJhY3kgZm9yIGZhbWlseSwgZ2VuZXJhLCBzcGVjaWVzIGluIHRoZSBqb2ludCBNYWxwaWdoaWFjZWFlLUNocnlzb2JhbGFuYWNlYWUgZGF0YXNldC4gV2UgdXNlZCBhcyBpbnB1dCBkYXRhIHZhcktvZGVzIHByb2R1Y2VkIGZyb20ga21lcnMgb2Ygc2l6ZSA3IGFuZCA1MDBLYnAgdG8gMjAwTWJwIG9mIGRhdGEsIG9yIGFsbCBvZiB0aGUgZGF0YSBhdmFpbGFibGUgaWYgbGVzcyB0aGFuIDIwMCBNYnAuIEZvciBlYWNoIHNhbXBsZSwgd2UgYnVpbHQgYSBtb2RlbCB1c2luZyBhcyBpbnB1dCBkYXRhIGZyb20gYWxsIG90aGVyIHNhbXBsZXMuIFRoZW4gd2UgcXVlcmllZCB0aGUgc2FtcGxlIGxlZnQgb3V0LCB1c2luZyBhcyBpbnB1dCB0aGUgaW1hZ2VzIGdlbmVyYXRlZCBmcm9tIDUw
MEtiIHRvIHRoZSB0b3RhbCBkYXRhIGF2YWlsYWJsZS4gTm93IHdlIHdpbGwgc3VtbWFyaXplIHRoZSByZXN1bHRzLgoKCiMjIEFjY3VyYWN5IHZzIGRhdGEgYW1vdW50IGFuZCB0YXhvbm9taWMgbGV2ZWxzCgpJbiB0aGlzIHRlc3QsIHdlIHVzZWQgdmFyS29kZXIgW3YwLjYuMF0oaHR0cHM6Ly9naXRodWIuY29tL2JydW5vYXNtL3ZhcktvZGVyL3JlbGVhc2VzL3RhZy92LjAuNi4wKS4gTGV0J3MgcHJvY2VzcyB0aGUgcmVzdWx0cy4KCmBgYHtyfQpyZWFkX2FuZF9wcm9jZXNzX3h2YWwgPSBmdW5jdGlvbihpbmZvbGRlcil7CiAgcGxhbihtdWx0aXNlc3Npb24od29ya2VycyA9IDEyKSkKdmFya29kZXJfcmVzdWx0cyA9IGxpc3QuZmlsZXMoaW5mb2xkZXIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgJ3ByZWRpY3Rpb25zLmNzdicsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgcmVjdXJzaXZlPVQsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgZnVsbC5uYW1lcyA9IFQpICU+JQogIGZ1cnJyOjpmdXR1cmVfbWFwX2Rmcih+cmVhZF9jc3YoLngpICU+JSBtdXRhdGUoc2FtcGxlX2lkID0gYXMuY2hhcmFjdGVyKHNhbXBsZV9pZCkpKSAlPiUgCiAgc2VsZWN0KC0xKSAlPiUKICBmaWx0ZXIoc3RyX2RldGVjdChxdWVyeV9iYXNlcGFpcnMsJ14wK1sxMjVdMCtLJCcpKSAlPiUgI3dlIHdpbGwgaWdub3JlIHF1ZXJpZXMgdGhhdCBhcmUgbm90IHN0YW5kYXJkaXplZCBzaXplcwogIHJlbmFtZShxdWVyeV9icCA9IHF1ZXJ5X2Jhc2VwYWlycykgJT4lCiAgbXV0YXRlKHF1YWxpdHlfaW5jbHVkZWQgPSBUKQpwbGFuKHNlcXVlbnRpYWwpCgphbGxfdGF4bGFiZWxzID0gc3RyX3JlbW92ZSh2YXJrb2Rlcl9yZXN1bHRzJGFjdHVhbF9sYWJlbHMsIjsqbG93X3F1YWxpdHk6VHJ1ZTsqIikgJT4lIHN0cl9zcGxpdCgnOycpICU+JSB1bmxpc3QgJT4lIHVuaXF1ZQoKdmFya29kZXJfcmVzdWx0cyA9IHZhcmtvZGVyX3Jlc3VsdHMgJT4lCiAgbXV0YXRlKHF1ZXJ5X2xhYmVscyA9IHN0cl9yZW1vdmUoYWN0dWFsX2xhYmVscywiOypsb3dfcXVhbGl0eTpUcnVlOyoiKSAlPiUgc3RyX3NwbGl0KCc7JyksCiAgICAgICAgIHByZWRpY3RlZF9saXN0ID0gc3RyX3NwbGl0KHByZWRpY3RlZF9sYWJlbHMsJzsnKQogICAgICAgICApICU+JQogIHJvd3dpc2UoKSAlPiUKICBtdXRhdGUoZmFtaWx5X2NvcnJlY3QgPSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsJ2ZhbWlseScpXSAlaW4lIHByZWRpY3RlZF9saXN0LAogICAgICAgICBnZW51c19jb3JyZWN0ID0gcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCdnZW51cycpXSAlaW4lIHByZWRpY3RlZF9saXN0LAogICAgICAgICBzcGVjaWVzX2NvcnJlY3QgPSBpZmVsc2UoYW55KHN0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCdzcGVjaWVzJykpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgcXVlcnlf
bGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCdzcGVjaWVzJyldICVpbiUgcHJlZGljdGVkX2xpc3QsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBOQQogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgKSwKICAgICAgICAgZmFtaWx5X2luY29ycmVjdCA9IGFueSghKHByZWRpY3RlZF9saXN0W3N0cl9kZXRlY3QocHJlZGljdGVkX2xpc3QsJ2ZhbWlseScpXSAlaW4lIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywnZmFtaWx5JyldKSksCiAgICAgICAgIGdlbnVzX2luY29ycmVjdCA9IGFueSghKHByZWRpY3RlZF9saXN0W3N0cl9kZXRlY3QocHJlZGljdGVkX2xpc3QsJ2dlbnVzJyldICVpbiUgcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCdnZW51cycpXSkpLAogICAgICAgICBzcGVjaWVzX2luY29ycmVjdCA9IGlmZWxzZShhbnkoc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsJ3NwZWNpZXMnKSksCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBhbnkoIShwcmVkaWN0ZWRfbGlzdFtzdHJfZGV0ZWN0KHByZWRpY3RlZF9saXN0LCdzcGVjaWVzJyldICVpbiUgcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCdzcGVjaWVzJyldKSksCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBOQQogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgKQogICAgICAgICAKICAgICAgICAgKQoKcmV0dXJuKHZhcmtvZGVyX3Jlc3VsdHMpCn0KYGBgCgoKYGBge3J9CnN1bW1hcml6ZV9yZXN1bHRzID0gZnVuY3Rpb24ocmVzLGxldmVsKXsKICByZXMgPSByZXMgJT4lCiAgICB1bmdyb3VwKCkgJT4lCiAgICBtdXRhdGUobG93X3F1YWxpdHkgPSBzdHJfZGV0ZWN0KGFjdHVhbF9sYWJlbHMsImxvd19xdWFsaXR5OlRydWUiKSwKICAgICAgICAgICByZXN1bHQgPSBhcy5jaGFyYWN0ZXIoaWZlbHNlKHJlc1ssc3RyX2MobGV2ZWwsJ2NvcnJlY3QnLHNlcD0nXycpXSAmICFyZXNbLHN0cl9jKGxldmVsLCdpbmNvcnJlY3QnLHNlcD0nXycpXSwgJ2NvcnJlY3QnLAogICAgICAgICAgICAgICAgICAgICAgICAgICBpZmVsc2UocmVzWyxzdHJfYyhsZXZlbCwnY29ycmVjdCcsc2VwPSdfJyldICYgcmVzWyxzdHJfYyhsZXZlbCwnaW5jb3JyZWN0JyxzZXA9J18nKV0sICdhbWJpZ3VvdXMnLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgaWZlbHNlKCFyZXNbLHN0cl9jKGxldmVsLCdjb3JyZWN0JyxzZXA9J18nKV0gICYgcmVzWyxzdHJfYyhsZXZlbCwnaW5jb3JyZWN0JyxzZXA9J18nKV0sICdpbmNvcnJlY3QnLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgJ2luY29uY2x1c2l2ZScKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICkpKSkKICAgICAgICAgICApICU+JQogICAgZmlsdGVyKCFpcy5uYShyZXN1bHQpKSAlPiUKICAgIGdyb3VwX2J5KHF1ZXJ5X2JwLHJlc3VsdCkg
JT4lCiAgICBzdW1tYXJpc2UoTj1uKCksIC5ncm91cHMgPSAnZHJvcCcpICU+JQogICAgZ3JvdXBfYnkocXVlcnlfYnApICU+JQogICAgbXV0YXRlKHA9IE4vc3VtKE4pKSAlPiUKICAgIG11dGF0ZShxdWVyeV9icCA9IGFzLmludGVnZXIoc3RyX3JlbW92ZShxdWVyeV9icCwnSycpKSoxMDAwKSAlPiUKICAgIHVuZ3JvdXAoKSAlPiUKICAgIG11dGF0ZShxdWVyeV9icCA9IGFzLmZhY3RvcihxdWVyeV9icCkpICU+JQogICAgY29tcGxldGUocXVlcnlfYnAscmVzdWx0LCBmaWxsID0gbGlzdChwID0gMCwgTiA9IDApKSAlPiUKICAgIG11dGF0ZShxdWVyeV9icCA9IGFzLm51bWVyaWMoYXMuY2hhcmFjdGVyKHF1ZXJ5X2JwKSkpICU+JQogICAgdW5ncm91cCgpCiAgICAKICByZXR1cm4ocmVzKQp9CmBgYAoKCmBgYHtyfQpwbG90X2FyZWEgPSBmdW5jdGlvbihzdW1fZGYsIHRpdGxlLCByZWxhdGl2ZSA9IEZBTFNFLCBncmlkID0gVFJVRSwgeGxpbV9hbGwgPSBUUlVFKXsKICBicmVha3MgPSBjKDUwMDAwMCwKICAgICAgICAgICAgIDEwMDAwMDAsCiAgICAgICAgICAgICAyMDAwMDAwLAogICAgICAgICAgICAgNTAwMDAwMCwKICAgICAgICAgICAgIDEwMDAwMDAwLAogICAgICAgICAgICAgMjAwMDAwMDAsCiAgICAgICAgICAgICA1MDAwMDAwMCwKICAgICAgICAgICAgIDEwMDAwMDAwMCwKICAgICAgICAgICAgIDIwMDAwMDAwMAogICAgICAgICAgICAgKQogIGlmICh4bGltX2FsbCl7CiAgICB4bGltaXRzID0gcmFuZ2UoYnJlYWtzKQogIH0gZWxzZSB7CiAgICB4bGltaXRzID0gcmFuZ2Uoc3VtX2RmJHF1ZXJ5X2JwKQogIH0KICAKICAKICBzdW1fZGYgPSBzdW1fZGYgJT4lCiAgICBtdXRhdGUocmVzdWx0ID0gZmFjdG9yKHJlc3VsdCxvcmRlcmVkID0gVCwgbGV2ZWxzID0gYygnY29ycmVjdCcsJ2FtYmlndW91cycsJ2luY29uY2x1c2l2ZScsJ2luY29ycmVjdCcpKSkgCiAgaWYgKHJlbGF0aXZlKXsKICAgIHlsaW1pdHMgPSBjKDAsMSkKICB9IGVsc2UgewogICAgeWxpbWl0cyA9IGMoMCxzdW1fZGYgJT4lIGdyb3VwX2J5KHF1ZXJ5X2JwKSAlPiUgc3VtbWFyaXplKE49c3VtKE4pKSAlPiUgcHVsbChOKSAlPiUgbWF4KQogIH0KICAKICAKICAjIEdldCBjb2xvcnMgZnJvbSBhIENvbG9yIEJyZXdlciBwYWxldHRlCiAgYnJld2VyX2NvbG9ycyA8LSBSQ29sb3JCcmV3ZXI6OmJyZXdlci5wYWwoNCwgIkFjY2VudCIpCiAgCiAgaWYgKHJlbGF0aXZlKSB7CiAgICBwMSA9IGdncGxvdChzdW1fZGYsIGFlcyh4PXF1ZXJ5X2JwLHk9cCxmaWxsPXJlc3VsdCkpICsKICAgIGdlb21fYXJlYShwb3NpdGlvbj0nc3RhY2snKSArCiAgICBzY2FsZV9maWxsX21hbnVhbCh2YWx1ZXMgPSBzZXROYW1lcyhicmV3ZXJfY29sb3JzLCBjKCJjb3JyZWN0IiwgImFtYmlndW91cyIsICJpbmNvbmNsdXNpdmUiLCAiaW5jb3JyZWN0IikpKSArCiAgICBzY2FsZV9hbHBoYV9tYW51YWwodmFsdWVzPWMoMC41LDEpKSArCiAgICBzY2FsZV94X2xvZzEwKGxhYmVscyA9IHNjYWxl
czo6bGFiZWxfbnVtYmVyKHNjYWxlX2N1dCA9IHNjYWxlczo6Y3V0X3NpKCdicCcpKSxicmVha3MgPSBicmVha3MpICArCiAgICBzY2FsZV95X2NvbnRpbnVvdXMoKSArCiAgICBnZ3RpdGxlKHRpdGxlKSArCiAgICB5bGFiKCdGcmFjdGlvbiBvZiBzYW1wbGVzJykgKwogICAgeGxhYignQmFzZSBwYWlycyBpbiBxdWVyeSBpbWFnZXMnKSArCiAgICB0aGVtZV9mZXcoKSArCiAgICB0aGVtZShheGlzLnRleHQueCA9IGVsZW1lbnRfdGV4dChoanVzdD0xLGFuZ2xlPTQ1KSkKICB9IGVsc2UgewogICAgICBwMSA9IGdncGxvdChzdW1fZGYsIGFlcyh4PXF1ZXJ5X2JwLHk9TixmaWxsPXJlc3VsdCkpICsKICAgIGdlb21fYXJlYShwb3NpdGlvbj0nc3RhY2snKSArCiAgICBzY2FsZV9maWxsX21hbnVhbCh2YWx1ZXMgPSBzZXROYW1lcyhicmV3ZXJfY29sb3JzLCBjKCJjb3JyZWN0IiwgImFtYmlndW91cyIsICJpbmNvbmNsdXNpdmUiLCAiaW5jb3JyZWN0IikpKSArCiAgICBzY2FsZV9hbHBoYV9tYW51YWwodmFsdWVzPWMoMC41LDEpKSArCiAgICBzY2FsZV94X2xvZzEwKGxhYmVscyA9IHNjYWxlczo6bGFiZWxfbnVtYmVyKHNjYWxlX2N1dCA9IHNjYWxlczo6Y3V0X3NpKCdicCcpKSxicmVha3MgPSBicmVha3MpICAgKwogICAgc2NhbGVfeV9jb250aW51b3VzKCkgKwogICAgZ2d0aXRsZSh0aXRsZSkgKwogICAgeWxhYignTnVtYmVyIG9mIHNhbXBsZXMnKSArCiAgICB4bGFiKCdCYXNlIHBhaXJzIGluIHF1ZXJ5IGltYWdlcycpICsKICAgIHRoZW1lX2ZldygpICsKICAgIHRoZW1lKGF4aXMudGV4dC54ID0gZWxlbWVudF90ZXh0KGhqdXN0PTEsYW5nbGU9NDUpKQogIH0KICAKICBpZiAoZ3JpZCl7CiAgICBwMSA9IHAxICsKICAgICAgc2NhbGVfeV9jb250aW51b3VzKG4uYnJlYWtzID0gMTAsIG1pbm9yX2JyZWFrcyA9IHdhaXZlcigpKSArCiAgICAgIHRoZW1lKHBhbmVsLmJhY2tncm91bmQgPSBlbGVtZW50X3JlY3QoZmlsbCA9IE5BKSwKICAgICAgICAgICAgcGFuZWwuZ3JpZC5tYWpvci55ID0gZWxlbWVudF9saW5lKGNvbG91ciA9IGdyYXkoMC41KSksCiAgICAgICAgICAgIHBhbmVsLmdyaWQubWlub3IueSA9IGVsZW1lbnRfbGluZShjb2xvdXIgPSBncmF5KDAuNiksbGluZXR5cGUgPSAyKSwKICAgICAgICAgICAgcGFuZWwub250b3AgPSBUUlVFKQogIH0KICAKICBwMSA9IHAxICsgY29vcmRfY2FydGVzaWFuKHhsaW09eGxpbWl0cywgeWxpbT15bGltaXRzLGV4cGFuZCA9IEZBTFNFKQogIAogIHJldHVybihwMSkKfQogIApgYGAKCgpOb3cgbGV0J3MgcGxvdCBnZW51cy1sZXZlbCBhY2N1cmFjeSBmb3IgYSBtb2RlbCB0YWtpbmcgcXVhbGl0eSBsYWJlbHMgaW50byBhY2NvdW50OgoKCmBgYHtyLCBtZXNzYWdlID0gRkFMU0UsIHdhcm5pbmcgPSBGQUxTRX0KcmVzdWx0cyA9IHJlYWRfYW5kX3Byb2Nlc3NfeHZhbCgnTWFscGlnaGlhY2VhZStDaHJ5c29iYWxhbmFjZWFlL3ZhcktvZGVyL3ZpdF9yZXN1bHRzLycpCnN1bW1hcnlfZ2VudXMgPSBz
dW1tYXJpemVfcmVzdWx0cyhyZXN1bHRzLCdnZW51cycpCnBfZ2VudXMgPSBwbG90X2FyZWEoc3VtbWFyeV9nZW51cywgJ3ZhcktvZGVyIGdlbnVzJywgcmVsYXRpdmUgPSBUUlVFKQpwX2dlbnVzCmBgYApOb3cgdGhlIHNhbWUgYnV0IHdpdGggc3BlY2llcwpgYGB7cn0Kc3VtbWFyeV9zcGVjaWVzID0gc3VtbWFyaXplX3Jlc3VsdHMocmVzdWx0cywnc3BlY2llcycpCnBfc3BlY2llcyA9IHBsb3RfYXJlYShzdW1tYXJ5X3NwZWNpZXMsICd2YXJLb2RlciBzcGVjaWVzJywgcmVsYXRpdmUgPSBUUlVFKQpwX3NwZWNpZXMKYGBgCgpGaW5hbGx5LCBmYW1pbHkKYGBge3J9CnN1bW1hcnlfZmFtaWx5ID0gc3VtbWFyaXplX3Jlc3VsdHMocmVzdWx0cywnZmFtaWx5JykKcF9mYW1pbHkgPSBwbG90X2FyZWEoc3VtbWFyeV9mYW1pbHksICd2YXJLb2RlciBmYW1pbHknLCByZWxhdGl2ZSA9IFRSVUUpCnBfZmFtaWx5CmBgYAojIyB3aGF0IGV4cGxhaW5zIHRoZSBlcnJvcnM/CgpOb3cgd2Ugd2lsbCB0cnkgdG8gaWRlbnRpZnkgd2hpY2ggc2FtcGxlcyBmYWlsZWQgYW5kIHdoeSB0aGV5IGZhaWxlZC4gUGFydGljdWFybHksIGhvdyBkbyAKRE5BIHF1YWxpdHksIGFtb3VudCBvZiBkYXRhLCBhbmQgdGhlIG51bWJlciBvZiBzYW1wbGVzIHBlciBjbGFzcyBpbXBhY3QgcmVzdWx0cz8gV2Ugd2lsbCB1c2UgZ2VudXMtbGV2ZWwgcHJlZGljdGlvbnMgdG8gdGVzdC4KCmBgYHtyfQpnZW51c19wcmVkaWN0aW9ucyA9IHJlc3VsdHMgJT4lCiAgbXV0YXRlKHByZWRpY3RlZF9nZW51cyA9IHN0cl9leHRyYWN0KHByZWRpY3RlZF9sYWJlbHMsICdnZW51czpbXjtdKicpLAogICAgICAgICBhY3R1YWxfZ2VudXMgPSBzdHJfZXh0cmFjdChhY3R1YWxfbGFiZWxzLCAnZ2VudXM6W147XSonKSkgJT4lCiAgc2VsZWN0KC1zdGFydHNfd2l0aCgnZmFtaWx5JyksLXN0YXJ0c193aXRoKCdzcGVjaWVzJykpICU+JQogIHBpdm90X2xvbmdlcihjb2xzID0gc3RhcnRzX3dpdGgoImdlbnVzIiksIG5hbWVzX3RvID0gInByZWRpY3RlZF9sYWJlbCIsIHZhbHVlc190byA9ICJjb25maWRlbmNlIikgJT4lCiAgZmlsdGVyKGFjdHVhbF9nZW51cyA9PSBwcmVkaWN0ZWRfbGFiZWwpICU+JQogIHNlbGVjdChxdWVyeV9icCwgc2FtcGxlX2lkLCBiYXNlZnJlcXVlbmN5X3NkLCBhY3R1YWxfZ2VudXMsIGNvbmZpZGVuY2UpICU+JQogIG11dGF0ZShxdWVyeV9icCA9IDEwMDAqKHN0cl9yZW1vdmUocXVlcnlfYnAsICJLIikgJT4lIGFzLmludGVnZXIpKQoKZ2VudXNfcHJlZGljdGlvbnMgPSBnZW51c19wcmVkaWN0aW9ucyAlPiUKICBzZWxlY3Qoc2FtcGxlX2lkLCBhY3R1YWxfZ2VudXMpICU+JQogIGRpc3RpbmN0KCkgJT4lCiAgZ3JvdXBfYnkoYWN0dWFsX2dlbnVzKSAlPiUKICBzdW1tYXJpc2UoTl9zYW1wbGVzID0gbigpKSAlPiUKICByaWdodF9qb2luKGdlbnVzX3ByZWRpY3Rpb25zKQoKZ2VudXNfcHJlZGljdGlvbnMKYGBgCk5vdyBsZXQncyBtYWtlIHNvbWUgcGxvdHMuIEZpcnN0LCB3
aGF0IGlzIHRoZSBlZmZlY3Qgb2YgbnVtYmVyIG9mIHNhbXBsZXMgcGVyIGNsYXNzIGluIGNvbmZpZGVuY2U/CmBgYHtyfQpwbG90X2dlbnVzX05fdnNfY29uZiA9IGdncGxvdChnZW51c19wcmVkaWN0aW9ucywgYWVzKHggPSBOX3NhbXBsZXMtMSwgCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHkgPSBjb25maWRlbmNlKSkgKyAKICBzY2FsZV9jb2xvcl92aXJpZGlzX2MoKSArCiAgZ2VvbV9qaXR0ZXIoYWxwaGE9MC4zKSArIAogIHNjYWxlX3hfbG9nMTAoKSArCiAgI3lsYWIoJ0NvbmZpZGVuY2UgaW4gY29ycmVjdCBwcmVkaWN0aW9uXG4obG9naXQgc2NhbGUpJykgKwogIHlsYWIoJ0NvbmZpZGVuY2UgaW4gY29ycmVjdCBwcmVkaWN0aW9uJykgKwogIHhsYWIoJ051bWJlciBvZiBzYW1wbGVzIGluIGNvcnJlY3QgZ2VudXNcbihsb2cgc2NhbGUpJykgKwogICNzY2FsZV95X2NvbnRpbnVvdXModHJhbnMgPSAibG9naXQiLCBicmVha3MgPSBjKDFlLTQsMC4wMDEsMC4wMSwwLjEsMC4yNSwwLjUsMC43NSwwLjksMC45OSwwLjk5OSwxLTFlLTQpKSArCiAgc2NhbGVfeV9jb250aW51b3VzKGxpbWl0cz1jKDAsMSkpICsKICB0aGVtZV9mZXcoKSArCiAgdGhlbWUocGFuZWwuZ3JpZC5tYWpvci55ID0gZWxlbWVudF9saW5lKGNvbG91ciA9IGdyYXkoMC44KSkpCgpwbG90X2dlbnVzX05fdnNfY29uZgpgYGAKCk5vdywgd2hhdCBpcyB0aGUgZWZmZWN0IG9mIHNhbXBsZSBxdWFsaXR5IGluIGNvbmZpZGVuY2U/CmBgYHtyfQpwbG90X2dlbnVzX2ZyZXFzZF92c19jb25mID0gZ2dwbG90KGdlbnVzX3ByZWRpY3Rpb25zLCBhZXMoeCA9IGJhc2VmcmVxdWVuY3lfc2QsIHkgPSBjb25maWRlbmNlKSkgKyAKICBnZW9tX3BvaW50KGFscGhhPTAuMykgKyAKICBzY2FsZV94X2xvZzEwKCkgKwogICNzY2FsZV95X2NvbnRpbnVvdXModHJhbnMgPSAibG9naXQiLCBicmVha3MgPSBjKDFlLTQsMC4wMDEsMC4wMSwwLjEsMC4yNSwwLjUsMC43NSwwLjksMC45OSwwLjk5OSwxLTFlLTQpKSArCiAgc2NhbGVfeV9jb250aW51b3VzKGxpbWl0cz1jKDAsMSkpICsKICAjeWxhYignQ29uZmlkZW5jZSBpbiBjb3JyZWN0IHByZWRpY3Rpb25cbihsb2dpdCBzY2FsZSknKSArCiAgeWxhYignQ29uZmlkZW5jZSBpbiBjb3JyZWN0IHByZWRpY3Rpb24nKSArCiAgeGxhYignU3RhbmRhcmQgZGV2aWF0aW9uIG9mIGJhc2UgZnJlcXVlbmNpZXMnKSArCiAgdGhlbWVfZmV3KCkgKwogIHRoZW1lKHBhbmVsLmdyaWQubWFqb3IueSA9IGVsZW1lbnRfbGluZShjb2xvdXIgPSBncmF5KDAuOCkpKQoKcGxvdF9nZW51c19mcmVxc2RfdnNfY29uZgpgYGAKCk5vdywgd2hhdCBpcyB0aGUgZWZmZWN0IG9mIGFtb3VudCBvZiBkYXRhIGluIGNvbmZpZGVuY2U/CmBgYHtyfQpwbG90X2dlbnVzX2JwX3ZzX2NvbmYgPSBnZ3Bsb3QoZ2VudXNfcHJlZGljdGlvbnMsIGFlcyh4ID0gcXVlcnlfYnAsIHkgPSBjb25maWRlbmNlKSkgKyAKICBnZW9tX2ppdHRlcihhbHBoYT0wLjMpICsgCiAgI3Nj
YWxlX3lfY29udGludW91cyh0cmFucyA9ICJsb2dpdCIsIGJyZWFrcyA9IGMoMWUtNCwwLjAwMSwwLjAxLDAuMSwwLjI1LDAuNSwwLjc1LDAuOSwwLjk5LDAuOTk5LDEtMWUtNCkpICsKICBzY2FsZV95X2NvbnRpbnVvdXMobGltaXRzPWMoMCwxKSkgKwogICN5bGFiKCdDb25maWRlbmNlIGluIGNvcnJlY3QgcHJlZGljdGlvblxuKGxvZ2l0IHNjYWxlKScpICsKICB5bGFiKCdDb25maWRlbmNlIGluIGNvcnJlY3QgcHJlZGljdGlvbicpICsKICB4bGFiKCdCYXNlIHBhaXJzIGluIHF1ZXJ5IGltYWdlc1xuKGxvZyBzY2FsZSknKSArCiAgc2NhbGVfeF9sb2cxMCgpICsKICB0aGVtZV9mZXcoKSArCiAgdGhlbWUocGFuZWwuZ3JpZC5tYWpvci55ID0gZWxlbWVudF9saW5lKGNvbG91ciA9IGdyYXkoMC44KSkpCgpwbG90X2dlbnVzX2JwX3ZzX2NvbmYKYGBgCgpOb3cgbGV0J3Mgc2F2ZSB0aGUgdGhyZWUgb2YgdGhlbSBhcyBhIHNpbmdsZSBwbG90IHVzaW5nIGNvd3Bsb3QuCgpgYGB7cn0KY29tYmluZWRfY29uZiA9IHBhdGNod29yazo6d3JhcF9wbG90cyhwbG90X2dlbnVzX05fdnNfY29uZiArIHRoZW1lKHRleHQgPSBlbGVtZW50X3RleHQoc2l6ZT04KSksCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgcGxvdF9nZW51c19icF92c19jb25mICsgdGhlbWUoYXhpcy50aXRsZS55PWVsZW1lbnRfYmxhbmsoKSwgCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgYXhpcy50ZXh0Lnk9ZWxlbWVudF9ibGFuaygpLCAKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICB0ZXh0ID0gZWxlbWVudF90ZXh0KHNpemU9OCkpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHBsb3RfZ2VudXNfZnJlcXNkX3ZzX2NvbmYgKyB0aGVtZShheGlzLnRpdGxlLnk9ZWxlbWVudF9ibGFuaygpLCAKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgYXhpcy50ZXh0Lnk9ZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICB0ZXh0ID0gZWxlbWVudF90ZXh0KHNpemU9OCkpKSArCiAgcGF0Y2h3b3JrOjpwbG90X2Fubm90YXRpb24odGFnX2xldmVscyA9ICdBJykgCgpjb21iaW5lZF9jb25mCgpnZ3NhdmUoZmlsZW5hbWUgPSAnaW1hZ2VzX21hbnVzY3JpcHQvc3VwcF9jb25mX3ByZWRpY3RvcnMucGRmJyxkZXZpY2UgPSAncGRmJyx3aWR0aCA9IDcsaGVpZ2h0PTMsdW5pdHMgPSAnaW4nLHVzZURpbmdiYXRzPUYpCmBgYAoKCkxldCdzIHB1dCBpdCBhbGwgdG9nZXRoZXIgbm93IGluIGEgbGluZWFyIG1vZGVsOgoKYGBge3J9CmxtX2RhdGEgPSBnZW51c19wcmVkaWN0aW9ucyAlPiUKICBtdXRhdGUoY29uZmlk
ZW5jZSA9IGlmZWxzZShjb25maWRlbmNlID09IDEsIGNvbmZpZGVuY2UtMC4wMDAwMDAxLCBjb25maWRlbmNlKSwKICAgICAgICAgY29uZmlkZW5jZSA9IGNhcjo6bG9naXQoY29uZmlkZW5jZSkpICU+JQogIG11dGF0ZShxdWVyeV9icCA9IChxdWVyeV9icCAtIG1lYW4ocXVlcnlfYnApKS9zZChxdWVyeV9icCksCiAgICAgICAgIGJhc2VmcmVxdWVuY3lfc2QgPSAoYmFzZWZyZXF1ZW5jeV9zZCAtIG1lYW4oYmFzZWZyZXF1ZW5jeV9zZCkpL3NkKGJhc2VmcmVxdWVuY3lfc2QpLAogICAgICAgICBOX3NhbXBsZXMgPSAoTl9zYW1wbGVzIC0gbWVhbihOX3NhbXBsZXMpKS9zZChOX3NhbXBsZXMpCiAgICAgICAgICkgCgpmdWxsX21vZGVsID0gbG0oZm9ybXVsYSA9IGNvbmZpZGVuY2V+cXVlcnlfYnAqYmFzZWZyZXF1ZW5jeV9zZCpOX3NhbXBsZXMsIGRhdGEgPSBsbV9kYXRhKSAKZnVsbF9tb2RlbApzdW1tYXJ5KGZ1bGxfbW9kZWwpCnBsb3QoZnVsbF9tb2RlbCkKYGBgCgpgYGB7cn0KcmVkdWNlZF9tb2RlbCA9IHN0ZXAoZnVsbF9tb2RlbCwgZGlyZWN0aW9uID0iYm90aCIpCnJlZHVjZWRfbW9kZWwKc3VtbWFyeShyZWR1Y2VkX21vZGVsKQpwbG90KHJlZHVjZWRfbW9kZWwpCmBgYAoKCgoKCiMjIFNrbWVyCgpGb3Igc2ttZXIsIHdlIGxlZnQgZWFjaCBzYW1wbGUgb3V0LCBidWlsdCBhIHJlZmVyZW5jZSBhbmQgdGhlbiBxdWVyaWVkIHRoYXQgc2FtcGxlLiBXZSBoYXZlIHNldmVyYWwgZmlsZXMgaW4gd2hpY2ggcmVmZXJlbmNlIHNhbXBsZXMgYXJlIG9yZGVyZWQgYnkgdGhlaXIgZGlzdGFuY2UgdG8gdGhlIHF1ZXJ5LCB3ZSBoZXJlIHdlIHdpbGwgZXZhbHVhdGUgd2hldGhlciB0aGUgY2xvc2VzdCBzYW1wbGUgaXMgZnJvbSB0aGUgY29ycmVjdCBzcGVjaWVzIG9yIGdlbnVzLgoKQmVjYXVzZSBpdCBpcyBub3QgY2xlYXIgaG93IHNrbWVyIGJlaGF2ZXMgZm9yIGRpZmZlcmVudCBsZXZlbHMgb2YgY292ZXJhZ2UsIHdlIHJlcGVhdGVkIHRoaXMgZm9yIHNldmVyYWwgaW5wdXQgc2l6ZXMgKGluIG51bWJlciBvZiBiYXNlcGFpcnMpIGFzIHF1ZXJ5LCBidXQgYWx3YXlzIHVzZWQgdGhlIG1heGltdW0gaW5wdXQgZGl6ZSBhdmFpbGFibGUgKHVwIHRvIDIwME1iKSBmb3IgcmVmZXJlbmNlcy4KCkxldCdzIG1ha2UgYSBmdW5jdGlvbiB0aGF0IGV4dHJhY3RzIHRoZXNlIHJlc3VsdHMgYXMgYSB0YWJsZS4KCmBgYHtyfQoKc2FtcF9sYWJlbHMgPSByZXN1bHRzICU+JSBzZWxlY3Qoc2FtcGxlX2lkLGFjdHVhbF9sYWJlbHMpICU+JSBkaXN0aW5jdCgpCgpleHRyYWN0X3NrbWVyX3Jlc3VsdHMgPSBmdW5jdGlvbihmaWxlX3BhdGgpIHsKICAgICMgUmVhZCBvbmx5IHRoZSBmaXJzdCAyIGxpbmVzIG9mIHRoZSBmaWxlCiAgICBmaWxlX2xpbmVzIDwtIHJlYWRMaW5lcyhmaWxlX3BhdGgsIG4gPSAyKQogICAgCiAgICAjIEV4dHJhY3Qgc2FtcGxlX0lELCBiYXNlcGFpcnMgZnJvbSB0aGUgZmlyc3QgbGluZQogICAgc2FtcGxlX2luZm8gPC0gc3RyX21hdGNo
KGZpbGVfbGluZXNbMV0sICJcXHMqKC4qPylAKFxcZCtLKSIpWywgMjozXQogICAgc2FtcGxlX0lEIDwtIHNhbXBsZV9pbmZvWzFdCiAgICBiYXNlcGFpcnMgPC0gc2FtcGxlX2luZm9bMl0KICAgIAogICAgIyBFeHRyYWN0IHJlZmVyZW5jZV9zYW1wbGVfSUQsIGRpc3RhbmNlIGZyb20gdGhlIHNlY29uZCBsaW5lCiAgICByZWZlcmVuY2VfaW5mbyA8LSBzdHJfbWF0Y2goZmlsZV9saW5lc1syXSwgIlxccyooLio/KUAuKlxccysoXFxkK1xcLlxcZCspIilbLCAyOjNdCiAgICByZWZlcmVuY2Vfc2FtcGxlX0lEIDwtIHJlZmVyZW5jZV9pbmZvWzFdCiAgICBkaXN0YW5jZSA8LSBhcy5udW1lcmljKHJlZmVyZW5jZV9pbmZvWzJdKQogICAgCiAgICAjIENyZWF0ZSBhIHRpYmJsZQogICAgdGliYmxlKAogICAgICAgIHNhbXBsZV9pZCA9IHNhbXBsZV9JRCwKICAgICAgICBxdWVyeV9icCA9IGJhc2VwYWlycywKICAgICAgICBjbG9zZXN0X3JlZmVyZW5jZV9zYW1wbGVfaWQgPSByZWZlcmVuY2Vfc2FtcGxlX0lELAogICAgICAgIGNsb3Nlc3RfZGlzdGFuY2UgPSBkaXN0YW5jZQogICAgKSAKfQpgYGAKCk5vdyB3ZSB3aWxsIGFwcGx5IHRoaXMgZnVuY3Rpb24gdG8gYWxsIHNrbWVyIG91dHB1dCBmaWxlcy4KCmBgYHtyfQpwbGFuKG11bHRpc2Vzc2lvbih3b3JrZXJzID0gMTIpKQpza21lcl9yZXN1bHRzX2RmID0gZnVycnI6OmZ1dHVyZV9tYXBfZGZyKAogIGxpc3QuZmlsZXMoJ01hbHBpZ2hpYWNlYWUrQ2hyeXNvYmFsYW5hY2VhZS9za21lci9za21lcl94dmFsX3Jlc3VsdHMvJywgZnVsbC5uYW1lcyA9IFQpLAogIH4gZXh0cmFjdF9za21lcl9yZXN1bHRzKC54KQopICU+JQogIGxlZnRfam9pbihzYW1wX2xhYmVscywgYnkgPSAnc2FtcGxlX2lkJykgJT4lCiAgbGVmdF9qb2luKAogICAgc2FtcF9sYWJlbHMgJT4lIHNlbGVjdCgKICAgICAgY2xvc2VzdF9yZWZlcmVuY2Vfc2FtcGxlX2lkID0gJ3NhbXBsZV9pZCcsCiAgICAgIHByZWRpY3RlZF9sYWJlbHMgPSBhY3R1YWxfbGFiZWxzCiAgICApLAogICAgYnkgPSAnY2xvc2VzdF9yZWZlcmVuY2Vfc2FtcGxlX2lkJwogICkgJT4lCiAgbXV0YXRlKAogICAgcXVlcnlfbGFiZWxzID0gc3RyX3JlbW92ZShhY3R1YWxfbGFiZWxzLCAiOypsb3dfcXVhbGl0eTpUcnVlOyoiKSAlPiUgc3RyX3NwbGl0KCc7JyksCiAgICBwcmVkaWN0ZWRfbGlzdCA9IHN0cl9zcGxpdChwcmVkaWN0ZWRfbGFiZWxzLCAnOycpCiAgKSAlPiUKICByb3d3aXNlKCkgJT4lCiAgbXV0YXRlKAogICAgZmFtaWx5X2NvcnJlY3QgPSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdmYW1pbHknKV0gJWluJSBwcmVkaWN0ZWRfbGlzdCwKICAgIGdlbnVzX2NvcnJlY3QgPSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdnZW51cycpXSAlaW4lIHByZWRpY3RlZF9saXN0LAogICAgc3BlY2llc19jb3JyZWN0ID0gaWZlbHNlKGFueShzdHJfZGV0ZWN0KAogICAgICBxdWVyeV9sYWJlbHMsICdzcGVj
aWVzJwogICAgKSksCiAgICBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdzcGVjaWVzJyldICVpbiUgcHJlZGljdGVkX2xpc3QsCiAgICBOQSksCiAgICBmYW1pbHlfaW5jb3JyZWN0ID0gYW55KCEocHJlZGljdGVkX2xpc3Rbc3RyX2RldGVjdChwcmVkaWN0ZWRfbGlzdCwgJ2ZhbWlseScpXSAlaW4lIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ2ZhbWlseScpXSkpLAogICAgZ2VudXNfaW5jb3JyZWN0ID0gYW55KCEocHJlZGljdGVkX2xpc3Rbc3RyX2RldGVjdChwcmVkaWN0ZWRfbGlzdCwgJ2dlbnVzJyldICVpbiUgcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCAnZ2VudXMnKV0pKSwKICAgIHNwZWNpZXNfaW5jb3JyZWN0ID0gaWZlbHNlKGFueShzdHJfZGV0ZWN0KAogICAgICBxdWVyeV9sYWJlbHMsICdzcGVjaWVzJwogICAgKSksCiAgICBhbnkoISgKICAgICAgcHJlZGljdGVkX2xpc3Rbc3RyX2RldGVjdChwcmVkaWN0ZWRfbGlzdCwgJ3NwZWNpZXMnKV0gJWluJSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdzcGVjaWVzJyldCiAgICApKSwKICAgIE5BKQogICAgCiAgKQpwbGFuKHNlcXVlbnRpYWwpCnNrbWVyX3Jlc3VsdHNfZGYKYGBgCk5vdyBsZXQncyBzdW1tYXJpemUgYW5kIHBsb3QgYnkgZ2VudXM6CgpgYGB7cn0Kc2ttZXJfc3VtbWFyeV9nZW51cyA9IHN1bW1hcml6ZV9yZXN1bHRzKHNrbWVyX3Jlc3VsdHNfZGYsJ2dlbnVzJykKcF9za21lcl9nZW51cyA9IHBsb3RfYXJlYShza21lcl9zdW1tYXJ5X2dlbnVzLCAnU2ttZXIgZ2VudXMnLCByZWxhdGl2ZSA9IFRSVUUpCnBfc2ttZXJfZ2VudXMKYGBgCk5vdyBieSBzcGVjaWVzLiBJbiBTa21lciwgdGhlcmUgaXMgbm8gaW5jb25jbHVzaXZlIHJlc3VsdDogaWYgdGhlcmUgaXMgbm8gY29ycmVjdCBzcGVjaWVzIHByZWRpY3Rpb24sIGl0IG1lYW5zIHRoYXQgYSBzYW1wbGUgd2FzIHByZWRpY3RlZCBpbiB0aGUgd3JvbmcgZ2VudXMgYW5kIHRoZXJlZm9yZSBpdCBpcyBpbmNvcnJlY3QKCmBgYHtyfQpza21lcl9zdW1tYXJ5X3NwZWNpZXMgPSBzdW1tYXJpemVfcmVzdWx0cyhza21lcl9yZXN1bHRzX2RmLCdzcGVjaWVzJykgJT4lCiAgbXV0YXRlKHJlc3VsdCA9IGlmZWxzZShyZXN1bHQgPT0gJ2NvcnJlY3QnLCAnY29ycmVjdCcsJ2luY29ycmVjdCcpKSAlPiUKICBncm91cF9ieShxdWVyeV9icCxyZXN1bHQpICU+JQogIHN1bW1hcmlzZV9hbGwoc3VtKQpwX3NrbWVyX3NwZWNpZXMgPSBwbG90X2FyZWEoc2ttZXJfc3VtbWFyeV9zcGVjaWVzLCAnU2ttZXIgc3BlY2llcycsIHJlbGF0aXZlID0gVFJVRSkKcF9za21lcl9zcGVjaWVzCmBgYAoKQW5kIG5vdyBieSBmYW1pbHk6CgpgYGB7cn0Kc2ttZXJfc3VtbWFyeV9mYW1pbHkgPSBzdW1tYXJpemVfcmVzdWx0cyhza21lcl9yZXN1bHRzX2RmLCdmYW1pbHknKQpza21lcl9zdW1tYXJ5X2ZhbWlseSAKcF9za21lcl9mYW1pbHkgPSBwbG90X2Fy
ZWEoc2ttZXJfc3VtbWFyeV9mYW1pbHksICdTa21lciBmYW1pbHknLCByZWxhdGl2ZSA9IFRSVUUpCnBfc2ttZXJfZmFtaWx5CmBgYAoKIyBUcmFkaXRpb25hbCBiYXJjb2RlcwojIyBCTEFTVCBzaW5nbGUgZ2VuZQpMZXQncyBub3cgcmVhZCB0aGUgdHJhZGl0aW9uYWwgYmFyY29kZSBCTEFTVCByZXN1bHRzIGFuZCBzdW1tYXJpemUgdGhlbSBpbiB0aGUgc2FtZSB3YXkgYXMgc2ttZXIgYW5kIHZhcktvZGVyLiBMZXQncyBzdGFydCBieSBkZWZpbmluZyBhIGZ1Y3Rpb24gdGhhdCByZWFkcyB0aGUgZGF0YSBzbyB3ZSBjYW4gc3VtbWFyaXplIGl0IHVzaW5nIHRoZSBwcmV2aW91c2x5IGRlZmluZWQgZnVuY3Rpb25zLgoKYGBge3J9CnJlYWRfdHJhZGl0aW9uYWxfYmFyY29kZXMgPSBmdW5jdGlvbihicCkgewogIGlucHV0X2ZpbGUgPSBwYXN0ZTAoCiAgICAnTWFscGlnaGlhY2VhZStDaHJ5c29iYWxhbmFjZWFlL3RyYWRpdGlvbmFsX2JhcmNvZGVzLzJfYmxhc3RfcGh5bG9nZW55X3Jlc3VsdC9HZW51cy8nLAogICAgYnAsCiAgICAnTV9ibGFzdF9waHlsb19zdW1fc3AudHN2JwogICkKICAKICBiYXJjb2RlX3JlcyA9IHJlYWRfZGVsaW0oaW5wdXRfZmlsZSkgJT4lCiAgICBwaXZvdF9sb25nZXIoLXNwLCBuYW1lc190byA9ICdtYXJrZXInLCB2YWx1ZXNfdG8gPSAnY2xvc2VzdF9yZWZlcmVuY2Vfc2FtcGxlX2lkJykgJT4lCiAgICByZW5hbWUoc2FtcGxlX2lkID0gJ3NwJykgJT4lCiAgICBtdXRhdGUoCiAgICAgIHNhbXBsZV9pZCA9IHN0cl9yZW1vdmVfYWxsKHNhbXBsZV9pZCwgJ0AuKycpLAogICAgICBjbG9zZXN0X3JlZmVyZW5jZV9zYW1wbGVfaWQgPSBzdHJfcmVtb3ZlX2FsbChjbG9zZXN0X3JlZmVyZW5jZV9zYW1wbGVfaWQsICdALisnKSwKICAgICAgcHJlZGljdGVkX2xhYmVscyA9IHNhbXBfbGFiZWxzJGFjdHVhbF9sYWJlbHNbbWF0Y2goY2xvc2VzdF9yZWZlcmVuY2Vfc2FtcGxlX2lkLCBzYW1wX2xhYmVscyRzYW1wbGVfaWQpXSwKICAgICAgYWN0dWFsX2xhYmVscyA9IHNhbXBfbGFiZWxzJGFjdHVhbF9sYWJlbHNbbWF0Y2goc2FtcGxlX2lkLCBzYW1wX2xhYmVscyRzYW1wbGVfaWQpXQogICAgKSAlPiUKICAgIGZpbHRlcihtYXJrZXIgIT0gJ0NvbmNhdGVuYXRlZF9waHlsb2dlbnknKSAlPiUKICAgIG11dGF0ZSgKICAgICAgcXVlcnlfbGFiZWxzID0gc3RyX3JlbW92ZShhY3R1YWxfbGFiZWxzLCAiOypsb3dfcXVhbGl0eTpUcnVlOyoiKSAlPiUgc3RyX3NwbGl0KCc7JyksCiAgICAgIHByZWRpY3RlZF9saXN0ID0gc3RyX3NwbGl0KHByZWRpY3RlZF9sYWJlbHMsICc7JykKICAgICkgJT4lCiAgICByb3d3aXNlKCkgJT4lCiAgICBtdXRhdGUoCiAgICAgIGZhbWlseV9jb3JyZWN0ID0gcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCAnZmFtaWx5JyldICVpbiUgcHJlZGljdGVkX2xpc3QsCiAgICAgIGdlbnVzX2NvcnJlY3QgPSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdnZW51cycp
XSAlaW4lIHByZWRpY3RlZF9saXN0LAogICAgICBzcGVjaWVzX2NvcnJlY3QgPSBpZmVsc2UoYW55KHN0cl9kZXRlY3QoCiAgICAgICAgcXVlcnlfbGFiZWxzLCAnc3BlY2llcycKICAgICAgKSksCiAgICAgIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ3NwZWNpZXMnKV0gJWluJSBwcmVkaWN0ZWRfbGlzdCwKICAgICAgTkEpLAogICAgICBmYW1pbHlfaW5jb3JyZWN0ID0gYW55KCEocHJlZGljdGVkX2xpc3Rbc3RyX2RldGVjdChwcmVkaWN0ZWRfbGlzdCwgJ2ZhbWlseScpXSAlaW4lIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ2ZhbWlseScpXSkpLAogICAgICBnZW51c19pbmNvcnJlY3QgPSBhbnkoIShwcmVkaWN0ZWRfbGlzdFtzdHJfZGV0ZWN0KHByZWRpY3RlZF9saXN0LCAnZ2VudXMnKV0gJWluJSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdnZW51cycpXSkpLAogICAgICBzcGVjaWVzX2luY29ycmVjdCA9IGlmZWxzZShhbnkoc3RyX2RldGVjdCgKICAgICAgICBxdWVyeV9sYWJlbHMsICdzcGVjaWVzJwogICAgICApKSwKICAgICAgYW55KCEoCiAgICAgICAgcHJlZGljdGVkX2xpc3Rbc3RyX2RldGVjdChwcmVkaWN0ZWRfbGlzdCwgJ3NwZWNpZXMnKV0gJWluJSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdzcGVjaWVzJyldCiAgICAgICkpLAogICAgICBOQSkKICAgICkgJT4lCiAgICBtdXRhdGVfYXQodmFycyhlbmRzX3dpdGgoIl9jb3JyZWN0IiksIGVuZHNfd2l0aCgiX2luY29ycmVjdCIpKSwKICAgICAgICAgICAgICB+IGlmZWxzZShpcy5uYShwcmVkaWN0ZWRfbGFiZWxzKSAmICFpcy5uYSguKSwgRkFMU0UsIC4pKSAlPiUKICAgIG11dGF0ZShxdWVyeV9icCA9IGJwICogMWUzKQogIAogIHJldHVybihiYXJjb2RlX3JlcykKfQpgYGAKCgpOb3cgd2UgY2FuIGFwcGx5IHRoaXMgZnVuY3Rpb24gdG8gYWxsIG9mIG91ciByZXN1bHRzOgoKYGBge3J9CnJlc3VsdHNfYmFyY29kZXMgPSBwdXJycjo6bWFwX2RmcihjKDEwLDIwLDUwLDEwMCwyMDApLHJlYWRfdHJhZGl0aW9uYWxfYmFyY29kZXMpCnJlc3VsdHNfYmFyY29kZXMKYGBgCgpOb3cgbGV0J3Mgc3VtbWFyaXNlIGZvciBlYWNoIG1hcmtlciBzZXBhcmF0ZWx5OgpgYGB7cn0KYmFyY29kZV9zdW1tYXJ5X2ZhbWlseSA9IHNwbGl0KHJlc3VsdHNfYmFyY29kZXMscmVzdWx0c19iYXJjb2RlcyRtYXJrZXIpICU+JQogIHB1cnJyOjptYXBfZGZyKH5zdW1tYXJpemVfcmVzdWx0cygueCwnZmFtaWx5JyksLmlkPSdtYXJrZXInKQoKYmFyY29kZV9zdW1tYXJ5X2ZhbWlseQpgYGAKCmBgYHtyfQpiYXJjb2RlX3N1bW1hcnlfZ2VudXMgPSBzcGxpdChyZXN1bHRzX2JhcmNvZGVzLHJlc3VsdHNfYmFyY29kZXMkbWFya2VyKSAlPiUKICBwdXJycjo6bWFwX2Rmcih+c3VtbWFyaXplX3Jlc3VsdHMoLngsJ2dlbnVzJyksLmlkPSdtYXJrZXInKQoKYmFyY29kZV9zdW1tYXJ5X2dlbnVzCmBgYAoK
YGBge3J9CmJhcmNvZGVfc3VtbWFyeV9zcGVjaWVzID0gc3BsaXQocmVzdWx0c19iYXJjb2RlcyxyZXN1bHRzX2JhcmNvZGVzJG1hcmtlcikgJT4lCiAgcHVycnI6Om1hcF9kZnIofnN1bW1hcml6ZV9yZXN1bHRzKC54LCdzcGVjaWVzJyksLmlkPSdtYXJrZXInKQoKYmFyY29kZV9zdW1tYXJ5X3NwZWNpZXMKYGBgCgpOb3cgbGV0J3MgcGxvdCwgbWFraW5nIHNlcGFyYXRlIHBsb3RzIGZvciBlYWNoIG1hcmtlcjoKClNwZWNpZXM6CmBgYHtyfQpwX2JhcmNvZGVfc3BlY2llcyA9IGJhcmNvZGVfc3VtbWFyeV9zcGVjaWVzICU+JQogIHNwbGl0KGJhcmNvZGVfc3VtbWFyeV9zcGVjaWVzJG1hcmtlcikgJT4lCiAgcHVycnI6Om1hcCh+cGxvdF9hcmVhKC54LHBhc3RlMCh1bmlxdWUoLngkbWFya2VyKSwnIHNwZWNpZXMnKSwgcmVsYXRpdmUgPSBUUlVFLCB4bGltX2FsbCA9IEZBTFNFKSkKCnBfYmFyY29kZV9zcGVjaWVzCmBgYApHZW5lcmE6CmBgYHtyfQpwX2JhcmNvZGVfZ2VudXMgPSBiYXJjb2RlX3N1bW1hcnlfZ2VudXMgJT4lCiAgc3BsaXQoYmFyY29kZV9zdW1tYXJ5X2dlbnVzJG1hcmtlcikgJT4lCiAgcHVycnI6Om1hcCh+cGxvdF9hcmVhKC54LHBhc3RlMCh1bmlxdWUoLngkbWFya2VyKSwnIGdlbnVzJyksIHJlbGF0aXZlID0gVFJVRSwgeGxpbV9hbGwgPSBGQUxTRSkpCgpwX2JhcmNvZGVfZ2VudXMKYGBgCkZhbWlseToKYGBge3J9CnBfYmFyY29kZV9mYW1pbHkgPSBiYXJjb2RlX3N1bW1hcnlfZmFtaWx5ICU+JQogIHNwbGl0KGJhcmNvZGVfc3VtbWFyeV9mYW1pbHkkbWFya2VyKSAlPiUKICBwdXJycjo6bWFwKH5wbG90X2FyZWEoLngscGFzdGUwKHVuaXF1ZSgueCRtYXJrZXIpLCcgZmFtaWx5JyksIHJlbGF0aXZlID0gVFJVRSx4bGltX2FsbCA9IEZBTFNFKSkKCnBfYmFyY29kZV9mYW1pbHkKYGBgCgojIyBDb25jYXRlbmF0ZWQgdHJlZQpOb3cgd2Ugd2lsbCBkbyB0aGUgc2FtZSBmb3IgY29uY2F0ZW5hdGVkIHRyZWUuIExldCdzIHN0YXJ0IGJ5IGRlZmluaW5nIGEgZnVuY3Rpb24gdG8gZ2F0aGVyIHJlc3VsdHMuIFdlIHdpbGwgY29uc2lkZXIgYSByZXN1bHQgYXMgY29ycmVjdCBpZiB0aGUgbWFqb3JpdHkgb2YgdGhlIHNpc3RlciB0YXhvbiB0byBhIHRpcCBoYXMgdGhlIHNhbWUgbGFiZWwuCgoKYGBge3J9CgpyZWFkX2NvbmNhdGVuYXRlZF90cmVlX3Jlc3VsdHMgPSBmdW5jdGlvbihicCl7CiAgCiAgCiMgUmVhZCBpbiB5b3VyIHRyZWUgLSByZXBsYWNlICd5b3VyX3RyZWVfZmlsZS5ud2snIHdpdGggdGhlIHBhdGggdG8geW91ciB0cmVlIGZpbGUKdHJlZSA9IHJlYWQudHJlZShwYXN0ZTAoJ01hbHBpZ2hpYWNlYWUrQ2hyeXNvYmFsYW5hY2VhZS90cmFkaXRpb25hbF9iYXJjb2Rlcy8yX2JsYXN0X3BoeWxvZ2VueV9yZXN1bHQvR2VudXMvY29uYy4nLGJwLCdtLnNwbmFtZS50cmUnKSkKCiNsZWF2ZSBvbmx5IHNhbXBsZSBJRHMgYXMgdGlwIGxhYmVscwp0cmVlJHRpcC5sYWJlbCA9IHRyZWUkdGlwLmxhYmVsICU+JSBzdHJfcmVt
b3ZlKCIuKkAiKSAlPiUgc3RyX3JlbW92ZSgiJyIpICU+JSBzdHJfcmVwbGFjZSgnIHJlZicsJ19yZWYnKQoKIyBDb21wdXRlIHRoZSBwYXRyaXN0aWMgZGlzdGFuY2VzIGFuZCBsaXN0IGFsbCByZWZlcmVuY2UgbmFtZXMKcGF0cmlzdGljX2Rpc3RhbmNlcyA8LSBjb3BoZW5ldGljKHRyZWUpCmFsbF9yZWZfbmFtZXMgPSBkaW1uYW1lcyhwYXRyaXN0aWNfZGlzdGFuY2VzKVtbMV1dW3N0cl9kZXRlY3QoZGltbmFtZXMocGF0cmlzdGljX2Rpc3RhbmNlcylbWzFdXSwnX3JlZiQnKV0KYWxsX25vbnJlZiA9IGRpbW5hbWVzKHBhdHJpc3RpY19kaXN0YW5jZXMpW1sxXV1bc3RyX2RldGVjdChkaW1uYW1lcyhwYXRyaXN0aWNfZGlzdGFuY2VzKVtbMV1dLCdfcmVmJCcsbmVnYXRlID0gVFJVRSldCgojIEZvciBlYWNoIHRpcCwgZmluZCB0aGUgcmVmZXJlbmNlIHNhbXBsZSB3aXRoIGNsb3Nlc3QgcGF0cmlzdGljIGRpc3RhbmNlCmZpbmRfY2xvc2VzdCA9IGZ1bmN0aW9uKHRpcCl7CiAgdG9fa2VlcCA9IGModGlwLGFsbF9yZWZfbmFtZXNbc3RyX2RldGVjdChhbGxfcmVmX25hbWVzLHBhc3RlMCh0aXAsJ19yZWYnKSxuZWdhdGUgPSBUUlVFKV0pCiAgcmV0dXJuKG5hbWVzKHNvcnQocGF0cmlzdGljX2Rpc3RhbmNlc1t0aXAsdG9fa2VlcF0pWzJdKSAlPiUKICAgICAgICAgICBzdHJfcmVtb3ZlKCdfcmVmJykpCn0KCmNsb3Nlc3RfbWF0Y2ggPSBwdXJycjo6bWFwX2NocihhbGxfbm9ucmVmLGZpbmRfY2xvc2VzdCkKCnNhbXBsZXNfd2l0aF9kYXRhID0gcmVhZF9kZWxpbShwYXN0ZTAoJ01hbHBpZ2hpYWNlYWUrQ2hyeXNvYmFsYW5hY2VhZS90cmFkaXRpb25hbF9iYXJjb2Rlcy8yX2JsYXN0X3BoeWxvZ2VueV9yZXN1bHQvR2VudXMvJyxicCwnTV9ibGFzdF9waHlsb19zdW1fc3AudHN2JykpICU+JSAKICBzZWxlY3Qoc2FtcGxlX2lkPXNwKSAlPiUKICBtdXRhdGUoc2FtcGxlX2lkID0gc3RyX3JlbW92ZV9hbGwoc2FtcGxlX2lkLCAnQC4rJykpCgpiYXJjb2RlX3JlcyA9IHRpYmJsZShzYW1wbGVfaWQgPSBhbGxfbm9ucmVmLAogICAgICAgY2xvc2VzdF9yZWZlcmVuY2Vfc2FtcGxlX2lkID0gY2xvc2VzdF9tYXRjaCkgJT4lCiAgcmlnaHRfam9pbihzYW1wbGVzX3dpdGhfZGF0YSkgJT4lCiAgbXV0YXRlKAogICAgICBwcmVkaWN0ZWRfbGFiZWxzID0gc2FtcF9sYWJlbHMkYWN0dWFsX2xhYmVsc1ttYXRjaChjbG9zZXN0X3JlZmVyZW5jZV9zYW1wbGVfaWQsIHNhbXBfbGFiZWxzJHNhbXBsZV9pZCldLAogICAgICBhY3R1YWxfbGFiZWxzID0gc2FtcF9sYWJlbHMkYWN0dWFsX2xhYmVsc1ttYXRjaChzYW1wbGVfaWQsIHNhbXBfbGFiZWxzJHNhbXBsZV9pZCldCiAgICApICU+JQogIGZpbHRlcihzYW1wbGVfaWQhPScyMDk1JykgJT4lCiAgbXV0YXRlKAogICAgICBxdWVyeV9sYWJlbHMgPSBzdHJfcmVtb3ZlKGFjdHVhbF9sYWJlbHMsICI7Kmxvd19xdWFsaXR5OlRydWU7KiIpICU+JSBzdHJfc3BsaXQoJzsnKSwKICAgICAgcHJlZGljdGVkX2xpc3QgPSBz
dHJfc3BsaXQocHJlZGljdGVkX2xhYmVscywgJzsnKQogICAgKSAlPiUKICAgIHJvd3dpc2UoKSAlPiUKICAgIG11dGF0ZSgKICAgICAgZmFtaWx5X2NvcnJlY3QgPSBxdWVyeV9sYWJlbHNbc3RyX2RldGVjdChxdWVyeV9sYWJlbHMsICdmYW1pbHknKV0gJWluJSBwcmVkaWN0ZWRfbGlzdCwKICAgICAgZ2VudXNfY29ycmVjdCA9IHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ2dlbnVzJyldICVpbiUgcHJlZGljdGVkX2xpc3QsCiAgICAgIHNwZWNpZXNfY29ycmVjdCA9IGlmZWxzZShhbnkoc3RyX2RldGVjdCgKICAgICAgICBxdWVyeV9sYWJlbHMsICdzcGVjaWVzJwogICAgICApKSwKICAgICAgcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCAnc3BlY2llcycpXSAlaW4lIHByZWRpY3RlZF9saXN0LAogICAgICBOQSksCiAgICAgIGZhbWlseV9pbmNvcnJlY3QgPSBhbnkoIShwcmVkaWN0ZWRfbGlzdFtzdHJfZGV0ZWN0KHByZWRpY3RlZF9saXN0LCAnZmFtaWx5JyldICVpbiUgcXVlcnlfbGFiZWxzW3N0cl9kZXRlY3QocXVlcnlfbGFiZWxzLCAnZmFtaWx5JyldKSksCiAgICAgIGdlbnVzX2luY29ycmVjdCA9IGFueSghKHByZWRpY3RlZF9saXN0W3N0cl9kZXRlY3QocHJlZGljdGVkX2xpc3QsICdnZW51cycpXSAlaW4lIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ2dlbnVzJyldKSksCiAgICAgIHNwZWNpZXNfaW5jb3JyZWN0ID0gaWZlbHNlKGFueShzdHJfZGV0ZWN0KAogICAgICAgIHF1ZXJ5X2xhYmVscywgJ3NwZWNpZXMnCiAgICAgICkpLAogICAgICBhbnkoISgKICAgICAgICBwcmVkaWN0ZWRfbGlzdFtzdHJfZGV0ZWN0KHByZWRpY3RlZF9saXN0LCAnc3BlY2llcycpXSAlaW4lIHF1ZXJ5X2xhYmVsc1tzdHJfZGV0ZWN0KHF1ZXJ5X2xhYmVscywgJ3NwZWNpZXMnKV0KICAgICAgKSksCiAgICAgIE5BKQogICAgKSAlPiUKICAgIG11dGF0ZV9hdCh2YXJzKGVuZHNfd2l0aCgiX2NvcnJlY3QiKSwgZW5kc193aXRoKCJfaW5jb3JyZWN0IikpLAogICAgICAgICAgICAgIH4gaWZlbHNlKGlzLm5hKHByZWRpY3RlZF9sYWJlbHMpICYgIWlzLm5hKC4pLCBGQUxTRSwgLikpICU+JQogICAgbXV0YXRlKHF1ZXJ5X2JwID0gYnAgKiAxZTMpCiAgCiAgcmV0dXJuKGJhcmNvZGVfcmVzKQp9CgpgYGAKCk5vdyBsZXQncyBhcHBseSB0aGlzIGZ1bmN0aW9uCmBgYHtyfQpyZXN1bHRzX2NvbmNhdF9iYXJjb2RlcyA9IHB1cnJyOjptYXBfZGZyKGMoMTAsMjAsNTAsMTAwLDIwMCkscmVhZF9jb25jYXRlbmF0ZWRfdHJlZV9yZXN1bHRzKQpyZXN1bHRzX2NvbmNhdF9iYXJjb2RlcwpgYGAKTGV0J3Mgc3VtbWFyaXplIHJlc3VsdHMgYW5kIHBsb3QgZm9yIGdlbnVzLCBzcGVjaWVzIGFuZCBmYW1pbHkgYWNjdXJhY3kKCmBgYHtyfQpjb25jYXRfc3VtbWFyeV9zcGVjaWVzID0gc3VtbWFyaXplX3Jlc3VsdHMocmVzdWx0c19jb25jYXRfYmFyY29kZXMsJ3NwZWNpZXMnKQpwX2NvbmNhdF9zcGVj
aWVzID0gcGxvdF9hcmVhKGNvbmNhdF9zdW1tYXJ5X3NwZWNpZXMsIHJlbGF0aXZlID0gRkFMU0UsdGl0bGUgPSAnQ29uY2F0ZW5hdGVkIGJhcmNvZGVzIHNwZWNpZXMnLHhsaW1fYWxsID0gRkFMU0UpCnBfY29uY2F0X3NwZWNpZXMKYGBgCmBgYHtyfQpjb25jYXRfc3VtbWFyeV9nZW51cyA9IHN1bW1hcml6ZV9yZXN1bHRzKHJlc3VsdHNfY29uY2F0X2JhcmNvZGVzLCdnZW51cycpCnBfY29uY2F0X2dlbnVzID0gcGxvdF9hcmVhKGNvbmNhdF9zdW1tYXJ5X2dlbnVzLCByZWxhdGl2ZSA9IFRSVUUsdGl0bGUgPSAnQ29uY2F0ZW5hdGVkIGJhcmNvZGVzIGdlbnVzJyx4bGltX2FsbCA9IFRSVUUpCnBfY29uY2F0X2dlbnVzCmBgYAoKYGBge3J9CmNvbmNhdF9zdW1tYXJ5X2ZhbWlseSA9IHN1bW1hcml6ZV9yZXN1bHRzKHJlc3VsdHNfY29uY2F0X2JhcmNvZGVzLCdmYW1pbHknKQpwX2NvbmNhdF9mYW1pbHkgPSBwbG90X2FyZWEoY29uY2F0X3N1bW1hcnlfZmFtaWx5LCByZWxhdGl2ZSA9IFRSVUUsdGl0bGUgPSAnQ29uY2F0ZW5hdGVkIGJhcmNvZGVzIGZhbWlseScseGxpbV9hbGwgPSBGQUxTRSkKcF9jb25jYXRfZmFtaWx5CmBgYAoKCgoKIyBEaXJlY3QgY29tcGFyaXNvbgoKTm93IGxldCdzIGNvbXBhcmUgbWV0aG9kcyBzaWRlIGJ5IHNpZGUuIEZvciBnZW51cyBsZXZlbDoKYGBge3IgZmlnLmhlaWdodD0xMH0KcDEgPSBwYXRjaHdvcms6OndyYXBfcGxvdHMocF9nZW51cyArIHRoZW1lKGF4aXMudGV4dC54ID0gZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgYXhpcy50aXRsZS54ID0gZWxlbWVudF9ibGFuaygpKSwgCiAgICAgICAgICAgICAgICAgICBwX3NrbWVyX2dlbnVzLCBuY29sID0gMSkgCnAyID0gcGF0Y2h3b3JrOjp3cmFwX3Bsb3RzKHBfYmFyY29kZV9nZW51cyRJVFMgKyB0aGVtZShsZWdlbmQucG9zaXRpb24gPSAnbm9uZScpLAogICAgICAgICAgICAgICAgICAgcF9iYXJjb2RlX2dlbnVzJHJiY0wgKyB0aGVtZShsZWdlbmQucG9zaXRpb24gPSAnbm9uZScsIAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRpdGxlLnkgPSBlbGVtZW50X2JsYW5rKCksCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGF4aXMudGV4dC55ID0gZWxlbWVudF9ibGFuaygpKSwKICAgICAgICAgICAgICAgICAgIHBfY29uY2F0X2dlbnVzICsgdGhlbWUoYXhpcy50aXRsZS55ID0gZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRleHQueSA9IGVsZW1lbnRfYmxhbmsoKSksCiAgICAgICAgICAgICAgICAgICBucm93ID0gMSkKcCA9IHBhdGNod29yazo6d3JhcF9wbG90cyhwMSxwMixuY29sPTEsaGVpZ2h0cyA9IGMoMC43LDAuMykpICsKICBwbG90X2Fubm90YXRpb24odGl0bGUgPSAnR2VudXMtbGV2ZWwgYWNjdXJhY3knKQpwCmdn
c2F2ZSgnaW1hZ2VzX21hbnVzY3JpcHQvZmlnM19nZW51c19hY2N1cmFjeS5wZGYnLCB3aWR0aD01LGhlaWdodCA9IDEwKQpnZ3NhdmUoJ2ltYWdlc19tYW51c2NyaXB0L2ZpZzNfZ2VudXNfYWNjdXJhY3kucG5nJywgd2lkdGg9NSxoZWlnaHQgPSAxMCxkcGk9MTIwMCkKYGBgCk5vdyBmb3Igc3BlY2llcyBsZXZlbDoKYGBge3IgZmlnLmhlaWdodCA9IDEwfQpwMSA9IHBhdGNod29yazo6d3JhcF9wbG90cyhwX3NwZWNpZXMgKyB0aGVtZShheGlzLnRleHQueCA9IGVsZW1lbnRfYmxhbmsoKSwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGF4aXMudGl0bGUueCA9IGVsZW1lbnRfYmxhbmsoKSksIAogICAgICAgICAgICAgICAgICAgcF9za21lcl9zcGVjaWVzLCBuY29sID0gMSkgCnAyID0gcGF0Y2h3b3JrOjp3cmFwX3Bsb3RzKHBfYmFyY29kZV9zcGVjaWVzJElUUyArIHRoZW1lKGxlZ2VuZC5wb3NpdGlvbiA9ICdub25lJyksCiAgICAgICAgICAgICAgICAgICBwX2JhcmNvZGVfc3BlY2llcyRyYmNMICsgdGhlbWUobGVnZW5kLnBvc2l0aW9uID0gJ25vbmUnLCAKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgYXhpcy50aXRsZS55ID0gZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRleHQueSA9IGVsZW1lbnRfYmxhbmsoKSksCiAgICAgICAgICAgICAgICAgICBwX2NvbmNhdF9zcGVjaWVzICsgdGhlbWUoYXhpcy50aXRsZS55ID0gZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRleHQueSA9IGVsZW1lbnRfYmxhbmsoKSksCiAgICAgICAgICAgICAgICAgICBucm93ID0gMSkKcCA9IHBhdGNod29yazo6d3JhcF9wbG90cyhwMSxwMixuY29sPTEsaGVpZ2h0cyA9IGMoMC43LDAuMykpICsKICBwbG90X2Fubm90YXRpb24odGl0bGUgPSAnc3BlY2llcy1sZXZlbCBhY2N1cmFjeScpCnAKZ2dzYXZlKCdpbWFnZXNfbWFudXNjcmlwdC9maWczX3NwZWNpZXNfYWNjdXJhY3kucGRmJywgd2lkdGg9NSxoZWlnaHQgPSAxMCkKZ2dzYXZlKCdpbWFnZXNfbWFudXNjcmlwdC9maWczX3NwZWNpZXNfYWNjdXJhY3kucG5nJywgd2lkdGg9NSxoZWlnaHQgPSAxMCxkcGk9MTIwMCkKYGBgCk5vdyBmb3IgZmFtaWx5IGxldmVsOgpgYGB7ciBmaWcuaGVpZ2h0ID0gMTB9CnAxID0gcGF0Y2h3b3JrOjp3cmFwX3Bsb3RzKHBfZmFtaWx5ICsgdGhlbWUoYXhpcy50ZXh0LnggPSBlbGVtZW50X2JsYW5rKCksCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRpdGxlLnggPSBlbGVtZW50X2JsYW5rKCkpLCAKICAgICAgICAgICAgICAgICAgIHBfc2ttZXJfZmFtaWx5LCBuY29sID0gMSkgCnAyID0gcGF0Y2h3b3JrOjp3cmFwX3Bsb3RzKHBfYmFyY29kZV9mYW1pbHkkSVRTICsgdGhlbWUobGVnZW5kLnBvc2l0
aW9uID0gJ25vbmUnKSwKICAgICAgICAgICAgICAgICAgIHBfYmFyY29kZV9mYW1pbHkkcmJjTCArIHRoZW1lKGxlZ2VuZC5wb3NpdGlvbiA9ICdub25lJywgCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGF4aXMudGl0bGUueSA9IGVsZW1lbnRfYmxhbmsoKSwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgYXhpcy50ZXh0LnkgPSBlbGVtZW50X2JsYW5rKCkpLAogICAgICAgICAgICAgICAgICAgcF9iYXJjb2RlX2ZhbWlseSRtYXRLICsgdGhlbWUoYXhpcy50aXRsZS55ID0gZWxlbWVudF9ibGFuaygpLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBheGlzLnRleHQueSA9IGVsZW1lbnRfYmxhbmsoKSksCiAgICAgICAgICAgICAgICAgICBucm93ID0gMSkKcCA9IHBhdGNod29yazo6d3JhcF9wbG90cyhwMSxwMixuY29sPTEsaGVpZ2h0cyA9IGMoMC43LDAuMykpICsKICBwbG90X2Fubm90YXRpb24odGl0bGUgPSAnZmFtaWx5LWxldmVsIGFjY3VyYWN5JykKcApnZ3NhdmUoJ2ltYWdlc19tYW51c2NyaXB0L2ZpZzNfZmFtaWx5X2FjY3VyYWN5LnBkZicsIHdpZHRoPTUsaGVpZ2h0ID0gMTApCmdnc2F2ZSgnaW1hZ2VzX21hbnVzY3JpcHQvZmlnM19mYW1pbHlfYWNjdXJhY3kucG5nJywgd2lkdGg9NSxoZWlnaHQgPSAxMCxkcGk9MTIwMCkKYGBgCgojIENvbXBhcmlzb24gb2YgcnVuIHRpbWVzCgpOb3cgbGV0J3MgY29tcGFyZSB0aGUgdGltZSB0byBwcm9kdWNlIHJlZmVyZW5jZXMgYW5kIHRvIHByb2R1Y2UgCgojIFNSQQoKRmluYWxseSwgbGV0J3Mgc3VtbWFyaXplIHJlc3VsdHMgZm9yIHRoZSB3aG9sZSBTUkEgZGF0YXNldC4gSW4gdGhpcyBjYXNlLCB3ZSBvbmx5IGhhdmUgdmFyS29kZXIgc2luY2UgU2ttZXIgY2Fubm90IGZpbmlzaCBhbmQgdHJhZGl0aW9uYWwgYmFyY29kZXMgYXJlIGluYXBwbGljYWJsZS4KCmBgYHtyfQp2YXJLb2Rlcl9TUkFfcmVzdWx0cyAgPSByZWFkX2NzdignYWxsX1NSQS92YXJrb2Rlcl9xdWVyeV9yZXN1bHRzL3ByZWRpY3Rpb25zLmNzdicpICU+JQpzZWxlY3QoLTEpICU+JQogIGZpbHRlcihzdHJfZGV0ZWN0KHF1ZXJ5X2Jhc2VwYWlycywnXjArWzEyNV0wK0skJykpICU+JSAjd2Ugd2lsbCBpZ25vcmUgcXVlcmllcyB0aGF0IGFyZSBub3Qgc3RhbmRhcmRpemVkIHNpemVzCiAgcmVuYW1lKHF1ZXJ5X2JwID0gcXVlcnlfYmFzZXBhaXJzKSAlPiUKICBtdXRhdGUocXVhbGl0eV9pbmNsdWRlZCA9IFQpCnBsYW4oc2VxdWVudGlhbCkKClNSQV90YXhsYWJlbHMgPSBzdHJfcmVtb3ZlKHZhcktvZGVyX1NSQV9yZXN1bHRzJGFjdHVhbF9sYWJlbHMsIjsqbG93X3F1YWxpdHk6VHJ1ZTsqIikgJT4lIHN0cl9zcGxpdCgnOycpICU+JSB1bmxpc3QgJT4lIHVuaXF1ZQoKdmFyS29kZXJfU1JBX3Jlc3VsdHMgPSB2YXJLb2Rlcl9TUkFfcmVzdWx0cyAlPiUKICBtdXRhdGUocXVlcnlfbGFiZWxzID0gc3Ry
X3JlbW92ZShhY3R1YWxfbGFiZWxzLCI7Kmxvd19xdWFsaXR5OlRydWU7KiIpICU+JSBzdHJfc3BsaXQoJzsnKSAlPiUgdW5saXN0LAogICAgICAgICBwcmVkaWN0ZWRfbGlzdCA9IHN0cl9zcGxpdChwcmVkaWN0ZWRfbGFiZWxzLCc7JykKICAgICAgICAgKSAlPiUKICByb3d3aXNlKCkgJT4lCiAgbXV0YXRlKGZhbWlseV9jb3JyZWN0ID0gcXVlcnlfbGFiZWxzICVpbiUgcHJlZGljdGVkX2xpc3QsCiAgICAgICAgIGZhbWlseV9pbmNvcnJlY3QgPSBpZmVsc2UoaXMubmEocHJlZGljdGVkX2xhYmVscyksRkFMU0UsYW55KCEocHJlZGljdGVkX2xpc3QgJWluJSBxdWVyeV9sYWJlbHMpKSkpICU+JQogc2VsZWN0KG1hdGNoZXMoIl5bXjAtOV0iKSkKCnZhcktvZGVyX1NSQV9yZXN1bHRzIAogICAgICAgICAKYGBgCgpOb3cgbGV0J3Mgc3VtbWFyaXplIGFuZCBwbG90OgoKYGBge3J9ClNSQV9zdW1tYXJ5X2ZhbWlseSA9IHN1bW1hcml6ZV9yZXN1bHRzKHZhcktvZGVyX1NSQV9yZXN1bHRzLCdmYW1pbHknKQpTUkFfc3VtbWFyeV9mYW1pbHkKCk5fc2FtcCA9IFNSQV9zdW1tYXJ5X2ZhbWlseSAlPiUKIGdyb3VwX2J5KHF1ZXJ5X2JwKSAlPiUKIHN1bW1hcmlzZShOID0gc3VtKE4pKQoKcF9TUkFfZmFtaWx5ID0gcGxvdF9hcmVhKFNSQV9zdW1tYXJ5X2ZhbWlseSwgJ3ZhcktvZGVyIFNSQSBmYW1pbHknLCByZWxhdGl2ZSA9IFRSVUUpIApwX1NSQV9mYW1pbHkgCmBgYAoKTGV0J3Mgbm93IGRvIHRoZSBTUkEgcGxvdCwgYnV0IHNwbGl0dGluZyBieSBraW5nZG9tLiBGaXJzdCwgd2UgbmVlZCB0byByZXRyaWV2ZSBraW5nZG9tIGluZm9ybWF0aW9uOgpgYGB7cn0KCnBfU1JBX2ZhbWlsaWVzID0gcmVhZF9jc3YoJ2FsbF9TUkEvcnVuc190b19kb3dubG9hZF9kYXRhLmNzdicpICU+JQogIHNlbGVjdChzYW1wbGVfaWQgPSBSdW4sIEtpbmdkb20pICU+JQogIHJpZ2h0X2pvaW4odmFyS29kZXJfU1JBX3Jlc3VsdHMpICU+JQogIHNwbGl0KC4kS2luZ2RvbSkgJT4lCiAgcHVycnI6Om1hcChzdW1tYXJpemVfcmVzdWx0cywgCiAgICAgICAgICAgICAgICAgbGV2ZWw9J2ZhbWlseScpICU+JQogIHB1cnJyOjppbWFwKH5wbG90X2FyZWEoLngsLnkscmVsYXRpdmU9VFJVRSkgKyBjb29yZF9jYXJ0ZXNpYW4oeGxpbT1jKDUwMCwxMDAwMCkqMTAwMCxleHBhbmQgPSBGQUxTRSkpCgpwX1NSQV9mYW1pbGllcwpgYGAKCk5vdyBsZXQncyBqb2luIHRvIGNyZWF0ZSBhIHBsb3QgZm9yIHB1YmxpY2F0aW9uOgoKYGBge3J9CnJlbW92ZV95X2F4aXNfYW5kX3NjYWxlID0gZnVuY3Rpb24oeCl7CiAgeCArCiAgICB0aGVtZShheGlzLnRpdGxlLnkgPSBlbGVtZW50X2JsYW5rKCksCiAgICAgICAgICBheGlzLnRleHQueSA9IGVsZW1lbnRfYmxhbmsoKSwKICAgICAgICAgIGF4aXMudGlja3MueSA9IGVsZW1lbnRfYmxhbmsoKSwKICAgICAgICAgIGxlZ2VuZC5wb3NpdGlvbj0nbm9uZScsCiAgICAgICAgICBheGlzLnRpdGxlLnggPSBlbGVtZW50X2JsYW5rKCkpCn0KCiMgTW9k
aWZ5IHRoZSBsYXN0IHBsb3QgdG8gaGF2ZSB0aGUgeC1heGlzIGxhYmVsCnBfU1JBX2ZhbWlsaWVzJEZ1bmdpIDwtIHBfU1JBX2ZhbWlsaWVzJEZ1bmdpICsgbGFicyh4ID0gIkJhc2UgcGFpcnMgaW4gcXVlcnkgaW1hZ2VzIikKCiMgQ29tYmluZSBwbG90cwpwX2NvbWJpbmVkIDwtIHdyYXBfcGxvdHMocF9TUkFfZmFtaWxpZXMkTWV0YXpvYSArIAogICAgICAgICAgICAgICAgICAgICAgICAgICB0aGVtZShsZWdlbmQucG9zaXRpb24gPSAnbm9uZScsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGF4aXMudGl0bGUueCA9IGVsZW1lbnRfYmxhbmsoKSksCiAgICAgICAgICAgICAgICAgICAgICAgICByZW1vdmVfeV9heGlzX2FuZF9zY2FsZShwX1NSQV9mYW1pbGllcyRWaXJpZGlwbGFudGFlKSwKICAgICAgICAgICAgICAgICAgICAgICAgIHJlbW92ZV95X2F4aXNfYW5kX3NjYWxlKHBfU1JBX2ZhbWlsaWVzJEZ1bmdpKSwKICAgICAgICAgICAgICAgICAgICAgICAgIG5yb3cgPSAxKQoKIyBBZGQgdGl0bGUgYW5kIHNldCBsYXlvdXQKIyBDcmVhdGUgYSBibGFuayBnZ3Bsb3Qgb2JqZWN0IHdpdGggdGhlIGRlc2lyZWQgeC1heGlzIHRpdGxlCnhfdGl0bGVfcGxvdCA8LSBnZ3Bsb3QoKSArIAogIHRoZW1lX3ZvaWQoKSArIAogIGxhYnMoeCA9ICJCYXNlIHBhaXJzIGluIHF1ZXJ5IGltYWdlcyIpICsKICB0aGVtZShwbG90Lm1hcmdpbiA9IG1hcmdpbigwLCAwLCAwLCAwKSwKICAgICAgICBheGlzLnRpdGxlLnggPSBlbGVtZW50X3RleHQoc2l6ZSA9IDEwLCBoanVzdCA9IDAuNSkpCgoKcCA9IHdyYXBfcGxvdHMocF9jb21iaW5lZCwgeF90aXRsZV9wbG90LG5jb2w9MSxoZWlnaHRzID0gYygwLjk1LDAuMDUpKQogICAgCiAgCgpwcmludChwKQoKCmdnc2F2ZSgnaW1hZ2VzX21hbnVzY3JpcHQvZmlnM19TUkFfYWNjdXJhY3kucGRmJywgd2lkdGg9NC41LGhlaWdodCA9IDQpCmdnc2F2ZSgnaW1hZ2VzX21hbnVzY3JpcHQvZmlnM19TUkFfYWNjdXJhY3kucG5nJywgd2lkdGg9NC41LGhlaWdodCA9IDQsZHBpID0gMTIwMCkKYGBgCgoKCiMgR2VuZXJhdGluZyBudW1iZXJzIGZvciBwdWJsaWNhdGlvbgoKSGVyZSB3ZSBqdXN0IHF1ZXJ5IG91ciByZXN1bHRzIHRvIGdldCBhIGZldyBmaWd1cmVzIHRoYXQgd2UgcmVwb3J0IGluIHRoZSBwYXBlci4KClRvdGFsIG51bWJlciBvZiBzYW1wbGVzIHVzZWQgaW4gY3Jvc3MtdmFsaWRhdGlvbjoKYGBge3J9CmRpbShzYW1wX2xhYmVscykKYGBgCgpOdW1iZXIgb2YgU3RpZ21hcGh5bGxvbiBzYW1wbGVzIHdpdGggZWFjaCBraW5kIG9mIGVycm9yIGZvciB2YXJrb2RlcjoKYGBge3J9CnN1bW1hcnlfc3BlY2llcwpgYGAKCk51bWJlciBvZiBTdGlnbWFwaHlsbG9uIHNhbXBsZXMgd2l0aCBlYWNoIGtpbmQgb2YgZXJyb3IgZm9yIHNrbWVyOgpgYGB7cn0Kc2ttZXJfc3VtbWFyeV9zcGVjaWVzCmBgYAp2YXJLb2RlciBhY2N1cmFjeSBmb3IgZ2VuZXJhOgpgYGB7cn0Kc3VtbWFyeV9nZW51cwpgYGAKdmFy
S29kZXIgYWNjdXJhY3kgZm9yIGZhbWlseToKYGBge3J9CnN1bW1hcnlfZmFtaWx5CmBgYAoKCgpTa21lciBhY2N1cmFjeSBmb3IgZ2VuZXJhOgpgYGB7cn0Kc2ttZXJfc3VtbWFyeV9nZW51cwpgYGAKClNrbWVyIGFjY3VyYWN5IGZvciBmYW1pbHk6CmBgYHtyfQpza21lcl9zdW1tYXJ5X2ZhbWlseQpgYGAKCgpOdW1iZXIgb2Ygc2FtcGxlcyBhdmFpbGFibGUgZm9yIGVhY2ggZ2VudXMgYW5kIGRhdGEgYW1vdW50CmBgYHtyfQpyZXN1bHRzICU+JQogIG11dGF0ZShnZW51cyA9IHN0cl9leHRyYWN0KGFjdHVhbF9sYWJlbHMsIig/PD1nZW51czopW147XSsiKSkgJT4lCiAgZ3JvdXBfYnkocXVlcnlfYnApICU+JQogIHN1bW1hcml6ZShOPW4oKSkgJT4lCiAgY29tcGxldGUoKQpgYGAKUGxvdCBudW1iZXIgb2Ygc2FtcGxlcyBmb3Igc3VwcGxlbWVudGFyeSBtYXRlcmlhbC4KCmBgYHtyfQpuX3NhbXBsZXNfZ2VuZXJhID0gcmVzdWx0cyAlPiUKICBtdXRhdGUodGF4b24gPSBzdHJfZXh0cmFjdChhY3R1YWxfbGFiZWxzLCIoPzw9Z2VudXM6KVteO10rIikpICU+JQogIGdyb3VwX2J5KHRheG9uLCBxdWVyeV9icCkgJT4lCiAgc3VtbWFyaXplKE49bigpKSAlPiUKICB1bmdyb3VwKCkgJT4lCiAgY29tcGxldGUodGF4b24sIHF1ZXJ5X2JwLCBmaWxsID0gbGlzdChOPTApKQpuX3NhbXBsZXNfZ2VuZXJhIAoKbl9zYW1wbGVzX3NwZWNpZXMgPSByZXN1bHRzICU+JQogIG11dGF0ZSh0YXhvbiA9IHN0cl9leHRyYWN0KGFjdHVhbF9sYWJlbHMsIig/PD1zcGVjaWVzOilbXjtdKyIpKSAlPiUKICBmaWx0ZXIoIWlzLm5hKHRheG9uKSkgJT4lCiAgZ3JvdXBfYnkodGF4b24sIHF1ZXJ5X2JwKSAlPiUKICBzdW1tYXJpemUoTj1uKCkpICU+JQogIHVuZ3JvdXAoKSAlPiUKICBjb21wbGV0ZSh0YXhvbiwgcXVlcnlfYnAsIGZpbGwgPSBsaXN0KE49MCkpCm5fc2FtcGxlc19zcGVjaWVzIAoKbl9zYW1wbGVzX1NSQSA9IHZhcktvZGVyX1NSQV9yZXN1bHRzICU+JQogIG11dGF0ZSh0YXhvbiA9IGFzLmNoYXJhY3RlcihhY3R1YWxfbGFiZWxzKSkgJT4lCiAgZ3JvdXBfYnkodGF4b24sIHF1ZXJ5X2JwKSAlPiUKICBzdW1tYXJpemUoTj1uKCkpICU+JQogIHVuZ3JvdXAoKSAlPiUKICBjb21wbGV0ZSh0YXhvbiwgcXVlcnlfYnAsIGZpbGwgPSBsaXN0KE49MCkpCm5fc2FtcGxlc19TUkEgCmBgYApgYGB7cn0KcGxvdF9Oc2FtcGxlc19hcmVhID0gZnVuY3Rpb24oZGYsIHRpdGxlKXsKICBkZiA9IGRmICU+JSAKICAgIG11dGF0ZShxdWVyeV9icCA9IHBhcnNlX251bWJlcihxdWVyeV9icCkgKjEwMDApCiAgCiAgbl9sZXZlbHMgPC0gbGVuZ3RoKHVuaXF1ZShkZiR0YXhvbikpCiAgdmlyaWRpc19jb2xvcnMgPC0gdmlyaWRpczo6dHVyYm8obl9sZXZlbHMpCiAgCiAgaGFsZl9uIDwtIGNlaWxpbmcobl9sZXZlbHMgLyAyKQogIHJlb3JkZXJlZF9jb2xvcnMgPC0gYyhyYmluZCh2aXJpZGlzX2NvbG9yc1sxOmhhbGZfbl0sIHZpcmlkaXNfY29sb3JzWyhoYWxmX24gKyAxKTpu
X2xldmVsc10pKQoKCiAgCiAgCiAgZ2dwbG90KGRmLCBhZXMoeD1xdWVyeV9icCx5PU4sZmlsbD10YXhvbiwgY29sb3IgPSB0YXhvbiwgZ3JvdXAgPSB0YXhvbikpICsKICAgIGdlb21fYXJlYShwb3NpdGlvbj0gcG9zaXRpb25fc3RhY2soKSkgKwogICAgI2dlb21fbGluZShwb3NpdGlvbj0nc3RhY2snKSArCiAgICBzY2FsZV9maWxsX21hbnVhbCh2YWx1ZXMgPSByZW9yZGVyZWRfY29sb3JzLCAKICAgICAgICAgICAgICAgICAgICAgIGFlc3RoZXRpY3MgPSBjKCdjb2xvdXInLCdmaWxsJyksCiAgICAgICAgICAgICAgICAgICAgICBndWlkZSA9ICdub25lJykgKwogICAgc2NhbGVfeF9sb2cxMChsYWJlbHMgPSBzY2FsZXM6OmxhYmVsX251bWJlcihzY2FsZV9jdXQgPSBzY2FsZXM6OmN1dF9zaSgnYnAnKSksCiAgICAgICAgICAgICAgICAgIGJyZWFrcyA9IDEwMDAqcGFyc2VfbnVtYmVyKHVuaXF1ZShuX3NhbXBsZXNfZ2VuZXJhJHF1ZXJ5X2JwKSksCiAgICAgICAgICAgICAgICAgIGxpbWl0cyA9IDEwMDAqcmFuZ2UocGFyc2VfbnVtYmVyKHVuaXF1ZShuX3NhbXBsZXNfZ2VuZXJhJHF1ZXJ5X2JwKSkpKSAgKwogICAgc2NhbGVfeV9jb250aW51b3VzKG4uYnJlYWtzID0gMTAsIG1pbm9yX2JyZWFrcyA9IHdhaXZlcigpKSArCiAgICBnZ3RpdGxlKHRpdGxlKSArCiAgICB5bGFiKCdOdW1iZXIgb2Ygc2FtcGxlcycpICsKICAgIHhsYWIoJ0Jhc2UgcGFpcnMgaW4gcXVlcnkgaW1hZ2VzJykgKwogICAgdGhlbWVfZmV3KCkgKwogICAgdGhlbWUoYXhpcy50ZXh0LnggPSBlbGVtZW50X3RleHQoaGp1c3Q9MSxhbmdsZT00NSksCiAgICAgICAgICBwYW5lbC5iYWNrZ3JvdW5kID0gZWxlbWVudF9yZWN0KGZpbGwgPSBOQSksCiAgICAgICAgICAgIHBhbmVsLmdyaWQubWFqb3IueSA9IGVsZW1lbnRfbGluZShjb2xvdXIgPSBncmF5KDAuNSkpLAogICAgICAgICAgICBwYW5lbC5ncmlkLm1pbm9yLnkgPSBlbGVtZW50X2xpbmUoY29sb3VyID0gZ3JheSgwLjYpLGxpbmV0eXBlID0gMiksCiAgICAgICAgICAgIHBhbmVsLm9udG9wID0gVFJVRSkKfQpgYGAKCmBgYHtyfQpOX3NwZWNpZXMgPSBwbG90X05zYW1wbGVzX2FyZWEobl9zYW1wbGVzX3NwZWNpZXMsdGl0bGU9J1N0aWdtYXBoeWxsb24gU3BlY2llcycpCk5fZ2VuZXJhID0gcGxvdF9Oc2FtcGxlc19hcmVhKG5fc2FtcGxlc19nZW5lcmEsdGl0bGU9J01hcGxpZ2hpYWNlYWUgYW5kIENocnlzb2JhbGFuYWNlYWUgR2VuZXJhJykKTl9mYW1pbGllcyA9IHBsb3RfTnNhbXBsZXNfYXJlYShuX3NhbXBsZXNfU1JBLHRpdGxlPSdTUkEgZmFtaWxlcycpCgpjb3dwbG90OjpwbG90X2dyaWQoTl9nZW5lcmEsTl9zcGVjaWVzLE5fZmFtaWxpZXMsIG5yb3cgPSAxKQpgYGAKClRvdGFsIG51bWJlciBvZiBTUkEgc2FtcGxlcy4gVmFsaWRhdGlvbjoKYGBge3J9CnJlYWRfY3N2KCd2YXJLb2Rlci9hbGxfU1JBL3ZhcmtvZGVyX3RyYWluZWRfbW9kZWxfTUwvaW5wdXRfZGF0YS5jc3YnKVstMV0gJT4lCiAgZ3JvdXBf
YnkoaXNfdmFsaWQpICU+JQogIHN1bW1hcmlzZShOID0gbigpKQpgYGAKCgoKCg==